@book{Whitehorn:2005:FTM:1098716,
  author    = {Whitehorn, Mark and Zare, Robert and Pasumansky, Mosha},
  title     = {Fast Track to MDX},
  publisher = {Springer-Verlag New York, Inc.},
  address   = {Secaucus, NJ, USA},
  year      = {2005},
  isbn      = {1846281741},
}

@inproceedings{110450,
  author    = {Sun, Xian-He and Ni, Lionel M.},
  title     = {Another view on parallel speedup},
  booktitle = {Supercomputing '90: Proceedings of the 1990 ACM/IEEE conference on Supercomputing},
  pages     = {324--333},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA, USA},
  location  = {New York, New York, United States},
  year      = {1990},
  isbn      = {0-89791-412-0},
}


@unpublished{920347-LbONsx,
  author = {K. Wu and Kurt Stockinger and Arie Shoshani},
  title  = {Performance of Multi-Level and Multi-Component Compressed Bitmap Indexes},
  year   = {2007},
  note   = {available from \url{http://www.osti.gov/bridge/servlets/purl/920347-LbONsx/}},
}

@article{wu2006obi,
  author    = {Wu, K. and Otoo, E. J. and Shoshani, A.},
  title     = {Optimizing bitmap indices with efficient compression},
  journal   = {ACM Transactions on Database Systems},
  volume    = {31},
  number    = {1},
  pages     = {1--38},
  year      = {2006},
  publisher = {ACM Press New York, NY, USA},
}

@phdthesis{hazel-thesis,
  author = {Hazel Webb},
  title  = {Properties and Applications of Diamond Cubes},
  school = {University of New Brunswick Saint John},
  year   = {2010},
}

@techreport{andrew-thesis,
  author      = {Andrew Albert},
  title       = {Diamond Dicing},
  type        = {Honours Thesis},
  institution = {University of New Brunswick Saint John},
  year        = {2006},
}

@article{indus-script,
  author       = {Rao, Rajesh P. N. and Yadav, Nisha and Vahia, Mayank N. and Joglekar, Hrishikesh and Adhikari, R. and Mahadevan, Iravatham},
  title        = {A {Markov} Model of the {Indus} Script},
  journal      = {Proceedings of the National Academy of Sciences of the United States of America},
  year         = {2009},
  doi          = {10.1073/pnas.0906237106},
  howpublished = {\url{http://www.pnas.org/content/early/2009/08/04/0906237106.abstract}},
}

@mastersthesis{richard-thesis,
  author = {Richard X. Liu},
  title  = {Simplifying Parallel Datacube Computation},
  school = {University of New Brunswick},
  year   = {2002},
}

@book{factor-analysis,
  author    = {Rummel, R. J.},
  title     = {Applied Factor Analysis},
  publisher = {Northwestern University Press},
  year      = {1970},
  isbn      = {0-8101-0254-4},
}

@incollection{biomed-abstract-classification,
  author    = {Alexandre Kouznetsov and Stan Matwin and Diana Inkpen and Amir H. Razavi and Oana Frunza and Morvarid Sehatkar and Leanne Seaward},
  title     = {Classifying Biomedical Abstracts Using Committees of Classifiers and Collective Ranking Techniques},
  booktitle = {Advances in Artificial Intelligence},
  series    = {Lecture Notes in Computer Science},
  volume    = {5549},
  pages     = {224--228},
  publisher = {Springer Berlin / Heidelberg},
  year      = {2009},
  isbn      = {978-3-642-01817-6},
  issn      = {0302-9743 (Print) 1611-3349 (Online)},
  doi       = {10.1007/978-3-642-01818-3},
}


@misc{social-networks,
  author       = {Hanneman, Robert and Riddle, Mark},
  title        = {Introduction to Social Networks},
  howpublished = {\url{http://www.faculty.ucr.edu/~hanneman/nettext/}},
  address      = {Riverside, CA, USA},
  year         = {2005},
}



@article{chinese-internet-topography,
  author  = {Zhou, S. and Zhang, G.-Q.},
  title   = {Chinese {Internet} {AS-level} Topology},
  journal = {IET Communications},
  volume  = {1},
  number  = {2},
  pages   = {209--214},
  year    = {2007},
  issn    = {1751-8628},
  doi     = {10.1049/iet-com:20060518},
}



@article{360421,
  author    = {Hipp, Jochen and G{\"u}ntzer, Ulrich and Nakhaeizadeh, Gholamreza},
  title     = {Algorithms for Association Rule Mining --- a General Survey and Comparison},
  journal   = {SIGKDD Explor. Newsl.},
  volume    = {2},
  number    = {1},
  pages     = {58--64},
  year      = {2000},
  issn      = {1931-0145},
  doi       = {10.1145/360402.360421},
  publisher = {ACM},
  address   = {New York, NY, USA},
}



@article{1453913,
  author    = {Koltsidas, Ioannis and Viglas, Stratis D.},
  title     = {Flashing up the storage layer},
  journal   = {Proc. VLDB Endow.},
  volume    = {1},
  number    = {1},
  pages     = {514--525},
  year      = {2008},
  issn      = {2150-8097},
  doi       = {10.1145/1453856.1453913},
  publisher = {VLDB Endowment},
}

@inproceedings{agrawal2008design,
  author    = {Agrawal, N. and Prabhakaran, V. and Wobber, T. and Davis, J. D. and Manasse, M. and Panigrahy, R.},
  title     = {Design Tradeoffs for {SSD} Performance},
  booktitle = {USENIX Annual Technical Conference},
  pages     = {57--70},
  year      = {2008},
}

@inproceedings{1559937,
  author    = {Lee, Sang-Won and Moon, Bongki and Park, Chanik},
  title     = {Advances in Flash Memory {SSD} Technology for Enterprise Database Applications},
  booktitle = {SIGMOD '09},
  pages     = {863--870},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Providence, Rhode Island, USA},
  year      = {2009},
  isbn      = {978-1-60558-551-2},
  doi       = {10.1145/1559845.1559937},
}



@inproceedings{102547,
  author    = {Wille, R.},
  title     = {Knowledge Acquisition by Methods of Formal Concept Analysis},
  booktitle = {Proceedings of the Conference on Data Analysis, Learning Symbolic and Numeric Knowledge},
  pages     = {365--380},
  publisher = {Nova Science Publishers, Inc.},
  address   = {Commack, NY, USA},
  location  = {Antibes},
  year      = {1989},
  isbn      = {0-941743-64-0},
}



@string{tcad    = "IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems"}
@string{dac82   = "Proc. 19th Design Automation Conference (DAC-82)"}
@string{dac88   = "Proc. 25th Design Automation Conference (DAC-88)"}
@string{iccd89  = "Proc. International Conference on Computer Design (ICCD-89)"}
@string{iccad90 = "Proc. International Conference on Computer-Aided Design (ICCAD-90)"}
% llc was defined twice; only the later, abbreviated definition took effect.
% The unabbreviated form is kept here, disabled (leading at-sign removed), so
% the macro has a single definition:
%   string{llc = "Literary and Linguistic Computing"}
@string{llc     = "Lit. and Linguistic Comp."}
@string{jasist  = "Journal of the American Society for Information Science and Technology"}
@string{csur    = "ACM Computing Surveys"}



@article{322332,
  author    = {Klug, Anthony},
  title     = {Equivalence of Relational Algebra and Relational Calculus Query Languages Having Aggregate Functions},
  journal   = {J. ACM},
  volume    = {29},
  number    = {3},
  pages     = {699--717},
  year      = {1982},
  issn      = {0004-5411},
  doi       = {10.1145/322326.322332},
  publisher = {ACM},
  address   = {New York, NY, USA},
}



@inproceedings{DBLP:conf/icde/Agrawal87,
  author    = {Rakesh Agrawal},
  title     = {Alpha: An Extension of Relational Algebra to Express a Class of Recursive Queries},
  booktitle = {ICDE'87},
  pages     = {580--590},
  year      = {1987},
}


@article{1132963,
  author    = {Geng, Liqiang and Hamilton, Howard J.},
  title     = {Interestingness measures for data mining: A survey},
  journal   = {ACM Comput. Surv.},
  volume    = {38},
  number    = {3},
  pages     = {9},
  year      = {2006},
  issn      = {0360-0300},
  doi       = {10.1145/1132960.1132963},
  publisher = {ACM},
  address   = {New York, NY, USA},
}


@inproceedings{1006247,
  author    = {Cozette, Olivier and Guermouche, Abdou and Utard, Gil},
  title     = {Adaptive Paging for a Multifrontal Solver},
  booktitle = {ICS '04: Proceedings of the 18th annual international conference on Supercomputing},
  pages     = {267--276},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Saint-Malo, France},
  year      = {2004},
  isbn      = {1-58113-839-3},
  doi       = {10.1145/1006209.1006247},
}


@misc{usb3,
  author       = {{Hewlett Packard} and Intel and Microsoft and {NEC} and {ST-NXP} and {Texas Instruments}},
  title        = {Universal Serial Bus Specification},
  howpublished = {\url{http://www.usb.org}},
  year         = {2008},
}

@article{1516514,
  author    = {Grohe, Martin and Hernich, Andr{\'e} and Schweikardt, Nicole},
  title     = {Lower bounds for processing data with few random accesses to external memory},
  journal   = {J. ACM},
  volume    = {56},
  number    = {3},
  pages     = {1--58},
  year      = {2009},
  issn      = {0004-5411},
  doi       = {10.1145/1516512.1516514},
  publisher = {ACM},
  address   = {New York, NY, USA},
}


@inproceedings{1514927,
  author    = {Chakaravarthy, Venkatesan T. and Pandit, Vinayaka and Sabharwal, Yogish},
  title     = {Analysis of sampling techniques for association rule mining},
  booktitle = {ICDT '09: Proceedings of the 12th International Conference on Database Theory},
  pages     = {276--283},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {St. Petersburg, Russia},
  year      = {2009},
  isbn      = {978-1-60558-423-2},
  doi       = {10.1145/1514894.1514927},
}

@comment{later addition is given later.}
@book{kimball2002dwtoolkit,
  author       = {Ralph Kimball and Margy Ross},
  title        = {The Data Warehouse Toolkit: The Complete Guide to Dimensional Modeling},
  edition      = {Second},
  publisher    = {Wiley},
  month        = apr,
  year         = {2002},
  interHash    = {d9c559968f8cb142089dc8a14c92c585},
  intraHash    = {32fe9dd2aa05806f37ac047ba151cc7b},
  bibitemlabel = {KiR02},
}

@inproceedings{1183515,
  author    = {Rizzi, Stefano and Abell{\'o}, Alberto and Lechtenb{\"o}rger, Jens and Trujillo, Juan},
  title     = {Research in Data Warehouse Modeling and Design: Dead or Alive?},
  booktitle = {DOLAP '06},
  pages     = {3--10},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Arlington, Virginia, USA},
  year      = {2006},
  isbn      = {1-59593-530-4},
  doi       = {10.1145/1183512.1183515},
}




@article{1497580,
  author    = {Cerf, Lo{\"\i}c and Besson, J{\'e}r{\'e}my and Robardet, C{\'e}line and Boulicaut, Jean-Fran{\c{c}}ois},
  title     = {Closed Patterns Meet N-ary Relations},
  journal   = {ACM Trans. Knowl. Discov. Data},
  volume    = {3},
  number    = {1},
  pages     = {1--36},
  year      = {2009},
  issn      = {1556-4681},
  doi       = {10.1145/1497577.1497580},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

@misc{hazel-website,
  author       = {Hazel Webb},
  title        = {Code Archive},
  howpublished = {\url{http://www.hazel-webb.com/archive.htm}},
  publisher    = {hazel-webb.com},
  year         = {2009},
  note         = {(Last checked 06-09-2010)},
}

@book{sql-standard-2008,
  author    = {{ISO~9075-1:2008}},
  title     = {Information technology: database languages -- {SQL} -- Part 1: Framework},
  edition   = {Third},
  publisher = {{ISO}, Geneva, Switzerland},
  year      = {2008},
}


@article{estaciomoreno-2008-136,
  author  = {Alexander Estacio-Moreno and Yannick Toussaint and Cedric Bousquet},
  title   = {Mining for adverse drug events with formal concept analysis},
  journal = {Studies in Health Technology and Informatics},
  volume  = {136},
  pages   = {803},
  year    = {2008},
  url     = {http://www.citebase.org/abstract?id=oai:arXiv.org:0901.4004},
}


@misc{hirsch-2005,
  author = {J.~E. Hirsch},
  title  = {An Index to Quantify an Individual's Scientific Research Output},
  year   = {2005},
  doi    = {10.1073/pnas.0507655102},
  note   = {\url{doi:10.1073/pnas.0507655102} (Last checked 07-29-2009)},
}


@article{1391730,
  author    = {Ilyas, Ihab F. and Beskales, George and Soliman, Mohamed A.},
  title     = {A Survey of Top-k Query Processing Techniques in Relational Database Systems},
  journal   = {ACM Comput. Surv.},
  volume    = {40},
  number    = {4},
  pages     = {1--58},
  year      = {2008},
  issn      = {0360-0300},
  doi       = {10.1145/1391729.1391730},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

@article{1287623,
  author    = {Morfonios, Konstantinos and Konakas, Stratis and Ioannidis, Yannis and Kotsis, Nikolaos},
  title     = {{ROLAP} Implementations of the Data Cube},
  journal   = {ACM Comput. Surv.},
  volume    = {39},
  number    = {4},
  pages     = {12},
  year      = {2007},
  issn      = {0360-0300},
  doi       = {10.1145/1287620.1287623},
  publisher = {ACM},
  address   = {New York, NY, USA},
}

@misc{Holzapfel06thecomplexity,
  author = {Klaus Holzapfel and Sven Kosub and Moritz G. Maa{\ss} and Hanjo T{\"a}ubig},
  title  = {The Complexity of Detecting Fixed-Density Clusters},
  year   = {2006},
}




@inproceedings{Raghavan03representingweb,
  author    = {Sriram Raghavan and Hector Garcia-Molina},
  title     = {Representing {Web} Graphs},
  booktitle = {ICDE'03},
  pages     = {1--10},
  publisher = {IEEE Computer Society},
  year      = {2003},
}


@misc{matryoshka,
  author    = {Roosevelt, Priscilla},
  title     = {Matryoshka Dolls},
  booktitle = {Encyclopedia of Russian History},
  publisher = {The Gale Group Inc. 2004},
  note      = {\url{http://www.encyclopedia.com/doc/1G2-3404100805.html} (Last checked 07-29-2009)},
  year      = {2009},
}

@misc{olap-council,
  author = {{{OLAP} Council, The}},
  title  = {{OLAP} and {OLAP} Server Definitions},
  note   = {\url{http://www.olapcouncil.org/research/resrchly.htm} (Last checked 07-29-2009)},
}

@inproceedings{chamberlain74,
  author    = {Chamberlin, Donald D. and Boyce, Raymond F.},
  title     = {{SEQUEL}: A Structured {English} Query Language},
  booktitle = {FIDET '74: Proceedings of the 1974 ACM SIGFIDET (now SIGMOD) workshop on Data description, access and control},
  pages     = {249--264},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Ann Arbor, Michigan},
  year      = {1974},
  doi       = {10.1145/800296.811515},
}


@article{codd70,
  author    = {Codd, E. F.},
  title     = {A Relational Model of Data for Large Shared Data Banks},
  journal   = {Commun. ACM},
  volume    = {13},
  number    = {6},
  pages     = {377--387},
  year      = {1970},
  issn      = {0001-0782},
  doi       = {10.1145/362384.362685},
  publisher = {ACM},
  address   = {New York, NY, USA},
}


@article{Newman2005PowerlawsPareto,
  author     = {Newman, M. E. J.},
  title      = {Power Laws, {Pareto} Distributions and {Zipf's} Law},
  journal    = {Contemporary Physics},
  volume     = {46},
  number     = {5},
  pages      = {323--351},
  publisher  = {Taylor \& Francis},
  year       = {2005},
  interHash  = {1e91cbd2816eaf41823f18b3db0808b9},
  intraHash  = {9b1495ac8518d8993445de4ac89b0096},
  jlprojects = {size_scaling},
  file       = {Newman2005PowerlawsPareto.pdf:Newman2005PowerlawsPareto.pdf:PDF},
}

@article{5038,
  author    = {Armenakis, A. C. and Garey, L. E. and Gupta, R. D.},
  title     = {An Adaptation of a Root Finding Method to Searching Ordered Disk Files},
  journal   = {BIT},
  volume    = {25},
  number    = {4},
  pages     = {562--568},
  year      = {1985},
  issn      = {0006-3835},
  publisher = {BIT Computer Science and Numerical Mathematics},
  address   = {Lawrence, KS, USA},
}


@mastersthesis{stratton82,
  author = {A. C. Stratton},
  title  = {Comparison of Searching Techniques},
  school = {University of New Brunswick},
  year   = {1982},
}

@article{Dowell:1972:PMC,
  author          = {M. Dowell and P. Jarratt},
  title           = {The {`Pegasus'} Method for Computing the Root of an Equation},
  journal         = {{BIT} Numerical Mathematics},
  volume          = {12},
  number          = {4},
  pages           = {503--508},
  month           = dec,
  year            = {1972},
  coden           = {BITTEL, NBITAB},
  doi             = {10.1007/BF01932959},
  issn            = {0006-3835 (print), 1572-9125 (electronic)},
  bibdate         = {Wed Jan 4 18:52:12 MST 2006},
  bibsource       = {ftp://ftp.math.utah.edu/pub/tex/bib/bit.bib; http://springerlink.metapress.com/openurl.asp?genre=issue&issn=0006-3835&volume=12&issue=4},
  url             = {http://www.springerlink.com/openurl.asp?genre=article&issn=0006-3835&volume=12&issue=4&spage=503},
  acknowledgement = ack-nhfb,
}


@proceedings{DBLP:conf/sigmod/97,
  title     = {SIGMOD 1997, Proceedings ACM SIGMOD International Conference on Management of Data, May 13-15, 1997, Tucson, Arizona, USA},
  editor    = {Joan Peckham},
  publisher = {ACM Press},
  year      = {1997},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}

@article{parnas94,
  author  = {Z.-Q. Luo and D. L. Parnas},
  title   = {On the Computational Complexity of the Maximum Trade Problem},
  journal = {Acta Mathematicae Applicatae Sinica (English Series)},
  volume  = {10},
  number  = {4},
  pages   = {434--440},
  year    = {1994},
  issn    = {0168-9673 (Print) 1618-3932 (Online)},
}


@article{sharma2008emc,
  author  = {Sharma, Y. and Goyal, N.},
  title   = {An Efficient Multi-Component Indexing Embedded Bitmap Compression for Data Reorganization},
  journal = {Information Technology Journal},
  volume  = {7},
  number  = {1},
  pages   = {160--164},
  year    = {2008},
}


  @inproceedings{icebergsemijoin,
    author    = {Mohammed Kasim Imthiyaz and Dong Xiaoan and Panos Kalnis},
    title     = {Efficient Processing of Distributed Iceberg Semi-joins},
    booktitle = {Database and Expert Systems Applications 15th International Conference, DEXA 2004},
    pages     = {634--643},
    publisher = {Springer Berlin/Heidelberg},
    year      = {2004},
    isbn      = {978-3-540-22936-0},
  }

@inproceedings{bda08,
  author    = {Kamel Aouiche and Daniel Lemire and Owen Kaser},
  title     = {Tri de la table de faits et compression des index bitmaps avec alignement sur les mots},
  booktitle = {BDA'08},
  year      = {2008},
}
 @comment {note =         {available from
                \url{http://arxiv.org/abs/0805.3339}}}


@techreport{Wu2001,
  author      = {Kesheng Wu and Ekow J. Otoo and Arie Shoshani and Henrik Nordberg},
  title       = {Notes on Design and Implementation of Compressed Bit Vectors},
  institution = {Lawrence Berkeley National Laboratory},
  number      = {LBNL/PUB-3161},
  year        = {2001},
  note        = {available from \url{http://crd.lbl.gov/~kewu/ps/PUB-3161.html}},
}



@techreport{diamond08,
  author      = {Hazel Webb and Owen Kaser and Daniel Lemire},
  title       = {Pruning Attribute Values from Data Cubes with Diamond Dicing},
  institution = {Computer Science and Applied Statistics, University of New Brunswick Saint John},
  number      = {TR-08-011},
  year        = {2008},
  note        = {available from \url{http://arxiv.org/abs/0805.0747}},
}


@inproceedings{diamond-ideas,
  author    = {Hazel Webb and Owen Kaser and Daniel Lemire},
  title     = {Pruning Attribute Values from Data Cubes with Diamond Dicing},
  booktitle = {International Database Engineering and Applications Symposium (IDEAS'08)},
  pages     = {121--129},
  year      = {2008},
}


@inproceedings{bennett2007np,
  author    = {Bennett, J. and Lanning, S.},
  title     = {The {Netflix} Prize},
  booktitle = {KDD Cup and Workshop 2007},
  year      = {2007},
}


@inproceedings{kamel08,
  author    = {Kamel Aouiche and Daniel Lemire and Robert Godin},
  title     = {Collaborative {OLAP} with Tag Clouds: {Web 2.0 OLAP} Formalism and Experimental Evaluation},
  booktitle = {WEBIST'08},
  pages     = {51--64},
  year      = {2008},
}

@incollection{kamel09,
  author    = {Kamel Aouiche and Daniel Lemire and Robert Godin},
  title     = {{Web 2.0 OLAP}: From Data Cubes to Tag Clouds},
  booktitle = {Web Information Systems and Technologies},
  series    = {Lecture Notes in Business Information Processing},
  volume    = {18},
  pages     = {51--64},
  publisher = {Springer},
  year      = {2009},
}

@article{1328925,
  author  = {Daniel Lemire and Owen Kaser},
  title   = {Hierarchical Bin Buffering: Online Local Moments for Dynamic External Memory Arrays},
  journal = {ACM Trans. Algorithms},
  volume  = {4},
  number  = {1},
  pages   = {1--31},
  year    = {2008},
  issn    = {1549-6325},
}


@inproceedings{vitter98data,
  author    = {Jeffrey Scott {Vitter} and Min {Wang} and Bala {Iyer}},
  title     = {Data Cube Approximation and Histograms via Wavelets},
  booktitle = {CIKM '98},
  address   = {New York, U.S.A.},
  pages     = {96--104},
  year      = {1998},
  isbn      = {1-58113-061-9},
  url       = {http://citeseer.ist.psu.edu/vitter98data.html},
}
@comment{Editor and publisher of the entry vitter98data, in case they are needed at some later date:
editor=         "Georges {Gardarin} and James C. {French} and Niki
                  {Pissinou} and Kia {Makki} and Luc {Bouganim}",
publisher =    "Association for Computing Machinery",
}

@inproceedings{dehne05pnp,
  author    = {Y. Chen and T. Eavis and F. Dehne and A. {Rau-Chaplin}},
  title     = {{PnP}: Parallel and External Memory Iceberg Cube Computation},
  booktitle = {ICDE'05},
  pages     = {576--577},
  year      = {2005},
  text      = {Chen, Dehne, Eavis, Rau-Chaplin. PnP: Parallel and external memory iceberg cube computation. ICDE, 2005.},
  url       = {http://citeseer.ist.psu.edu/dehne05pnp.html},
}

@inproceedings{roussopoulos97cubetree,
  author    = {Nick Roussopoulos and Yannis Kotidis and Mema Roussopoulos},
  title     = {Cubetree: organization of and bulk incremental updates on the data cube},
  booktitle = {SIGMOD '97},
  pages     = {89--99},
  year      = {1997},
  url       = {http://citeseer.ist.psu.edu/roussopoulos97cubetree.html},
}
@misc{qdbm,
  author       = {Mikio Hirabayashi},
  title        = {{QDBM}: Quick Database Manager},
  howpublished = {\url{http://qdbm.sourceforge.net/}~(checked 2008-02-22)},
  year         = {2006},
}


@misc{qdbm---fr,
  author       = {Mikio Hirabayashi},
  title        = {{QDBM}: Quick Database Manager},
  howpublished = {En ligne~: \url{http://qdbm.sourceforge.net/}},
  note         = {Dernier acc\`es le 22 f\'evrier 2008},
  year         = {2006},
}

@misc{netflix---fr,
  author       = {{Netflix, Inc.}},
  title        = {Netflix prize {README}},
  howpublished = {En ligne~: \url{http://www.netflixprize.com/community/viewtopic.php?id=68}},
  note         = {Dernier acc\`es le 4 janvier 2008},
  year         = {2007},
}

@misc{netflix,
  author       = {{Netflix, Inc.}},
  title        = {Netflix prize {README}},
  howpublished = {online: \url{http://www.netflixprize.com/community/viewtopic.php?id=68} (Last checked 06-09-2010)},
  year         = {2007},
}


@inproceedings{1183517,
  author    = {Riadh {Ben Messaoud} and Sabine {Loudcher Rabas{\'{e}}da} and Omar Boussaid and Rokia Missaoui},
  title     = {Enhanced Mining of Association Rules from Data Cubes},
  booktitle = {DOLAP '06},
  pages     = {11--18},
  year      = {2006},
}

@inproceedings{DBLP:conf/dolap/MessaoudRBM06,
  author              = {Riadh {Ben Messaoud} and Sabine {Loudcher Rabas{\'e}da} and Omar Boussaid and Rokia Missaoui},
  title               = {Enhanced mining of association rules from data cubes},
  booktitle           = {DOLAP},
  pages               = {11--18},
  year                = {2006},
  ee                  = {http://doi.acm.org/10.1145/1183512.1183517},
  crossref            = {DBLP:conf/dolap/2006},
  bibsource           = {DBLP, http://dblp.uni-trier.de},
  OwenDeprecationNote = {DEPRECATED, duplicate, use 1183517},
}

@proceedings{DBLP:conf/dolap/2006,
  editor    = {Il-Yeol Song and Panos Vassiliadis},
  title     = {DOLAP 2006, ACM 9th International Workshop on Data Warehousing and OLAP, Arlington, Virginia, USA, November 10, 2006, Proceedings},
  booktitle = {DOLAP},
  year      = {2006},
}

@article{KaserLemireIS2006,
  author  = {Owen Kaser and Daniel Lemire},
  title   = {Attribute Value Reordering For Efficient Hybrid {OLAP}},
  journal = {Information Sciences},
  volume  = {176},
  number  = {16},
  pages   = {2304--2336},
  year    = {2006},
}

@book{diamond,
  author       = {{Encyclop{\ae}dia Britannica online}},
  title        = {diamond},
  publisher    = {Encyclop{\ae}dia Britannica, Inc.},
  year         = {2007},
  howpublished = {\url{http://search.eb.com/eb/article-9030264}},
  note         = {Last checked 07-29-2009},
}

@article{321107,
  author    = {Stephen Warshall},
  title     = {A Theorem on Boolean Matrices},
  journal   = {J. ACM},
  volume    = {9},
  number    = {1},
  pages     = {11--12},
  year      = {1962},
  issn      = {0004-5411},
  doi       = {10.1145/321105.321107},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
}

@inproceedings{DBLP:conf/popl/AhoU79,
  author    = {Alfred V. Aho and Jeffrey D. Ullman},
  title     = {The Universality of Data Retrieval Languages},
  booktitle = {POPL},
  pages     = {110--120},
  year      = {1979},
  ee        = {db/conf/popl/AhoU79.html},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}

@inproceedings{Boulicautkdid2005,
  author    = {J{\'e}r{\'e}my Besson and Ruggero Pensa and C{\'e}line Robardet and Jean-Fran{\c{c}}ois Boulicaut},
  title     = {Constraint-based mining of fault tolerant patterns from Boolean data},
  booktitle = {KDID'05},
  year      = {2005},
  url       = {http://liris.cnrs.fr/~jboulica/kdid05.pdf},
}

@article{1024313,
  author    = {Sara C. Madeira and Arlindo L. Oliveira},
  title     = {Biclustering Algorithms for Biological Data Analysis: A Survey},
  journal   = {IEEE/ACM Trans. Comput. Biol. Bioinformatics},
  volume    = {1},
  number    = {1},
  pages     = {24--45},
  year      = {2004},
  issn      = {1545-5963},
  doi       = {10.1109/TCBB.2004.2},
  publisher = {IEEE Computer Society Press},
  address   = {Los Alamitos, CA, USA},
}

@inproceedings{660833,
  author    = {Yizong Cheng and George M. Church},
  title     = {Biclustering of Expression Data},
  booktitle = {Proceedings of the Eighth International Conference on Intelligent Systems for Molecular Biology},
  pages     = {93--103},
  publisher = {AAAI Press},
  year      = {2000},
  isbn      = {1-57735-115-0},
}

@techreport{peet:MEBP-tr,
  author      = {R. Peeters},
  title       = {The Maximum-Edge Biclique Problem is {NP}-Complete},
  institution = {Faculty of Economics and Business Administration, Tilburg University},
  type        = {Research Memorandum},
  number      = {789},
  year        = {2000},
  url         = {http://econpapers.hhs.se/paper/dgrkubrem/2000789.htm},
  urldate     = {2004-01-20},
}

@article{Lian2005,
  author  = {Wang Lian and David W. Cheung and S. M. Yiu},
  title   = {An Efficient Algorithm for Finding Dense Regions for Mining Quantitative Association Rules},
  journal = {Computers \& Mathematics with Applications},
  volume  = {50},
  number  = {3--4},
  pages   = {471--490},
  month   = aug,
  year    = {2005},
  url     = {http://www.sciencedirect.com/science/article/B6TYJ-4HDHH0H-G/2/968ce2d32c5c68133ab7227e850d6d},
}

@inproceedings{1007588,
  author    = {Graham Cormode and Flip Korn and S. Muthukrishnan and Divesh Srivastava},
  title     = {Diamond in the Rough: Finding Hierarchical Heavy Hitters in Multi-dimensional Data},
  booktitle = {SIGMOD '04},
  pages     = {155--166},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {Paris, France},
  year      = {2004},
  isbn      = {1-58113-859-8},
  doi       = {10.1145/1007568.1007588},
}

@article{amazon2003,
  author  = {Greg Linden and Brent Smith and Jeremy York},
  title   = {Amazon.com Recommendations: Item-to-Item Collaborative Filtering},
  journal = {IEEE Internet Computing},
  volume  = {7},
  number  = {1},
  pages   = {76--80},
  year    = {2003},
}

@article{pitas1989far,
  author  = {Pitas, I.},
  title   = {Fast algorithms for running ordering and max/min calculation},
  journal = {IEEE Transactions on Circuits and Systems},
  volume  = {36},
  number  = {6},
  pages   = {795--804},
  year    = {1989},
}

@article{139337,
  author    = {Marcel van Herk},
  title     = {A fast algorithm for local minimum and maximum filters on rectangular and octagonal kernels},
  journal   = {Pattern Recogn. Lett.},
  volume    = {13},
  number    = {7},
  pages     = {517--521},
  year      = {1992},
  issn      = {0167-8655},
  doi       = {10.1016/0167-8655(92)90069-C},
  publisher = {Elsevier Science Inc.},
  address   = {New York, NY, USA},
}

@inproceedings{YLBICDMO05,
  author    = {Daniel Lemire and Martin Brooks and Yuhong Yan},
  title     = {An Optimal Linear Time Algorithm for Quasi-Monotonic Segmentation},
  booktitle = {ICDM'05},
  pages     = {709--712},
  year      = {2005},
}

@article{602401,
  author    = {Jim Gray},
  title     = {What next?: A dozen information-technology research goals},
  journal   = {J. ACM},
  volume    = {50},
  number    = {1},
  pages     = {41--57},
  year      = {2003},
  issn      = {0004-5411},
  doi       = {10.1145/602382.602401},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
}

@article{keogh2005eid,
  author    = {Keogh, E. and Ratanamahatana, C. A.},
  title     = {Exact indexing of dynamic time warping},
  journal   = {Knowledge and Information Systems},
  volume    = {7},
  number    = {3},
  pages     = {358--386},
  year      = {2005},
  publisher = {Springer},
}

@article{628474,
  author    = {J. Gil and M. Werman},
  title     = {Computing 2-D Min, Median, and Max Filters},
  journal   = {IEEE Trans. Pattern Anal. Mach. Intell.},
  volume    = {15},
  number    = {5},
  pages     = {504--507},
  year      = {1993},
  issn      = {0162-8828},
  doi       = {10.1109/34.211471},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
}

@article{628856,
  author    = {Joseph (Yossi) Gil and Ron Kimmel},
  title     = {Efficient Dilation, Erosion, Opening, and Closing Algorithms},
  journal   = {IEEE Trans. Pattern Anal. Mach. Intell.},
  volume    = {24},
  number    = {12},
  pages     = {1606--1617},
  year      = {2002},
  issn      = {0162-8828},
  doi       = {10.1109/TPAMI.2002.1114852},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
}

@techreport{lemiremaxminarxiv,
  author      = {Daniel Lemire},
  title       = {Streaming Maximum-Minimum Filter Using No More than 3 Comparisons per Element},
  institution = {arxiv.org},
  number      = {cs.DS/0610046},
  year        = {2006},
}

@article{han2005sca,
  author    = {Han, J. and Chen, Y. and Dong, G. and Pei, J. and Wah, B. W. and Wang, J. and Cai, Y. D.},
  title     = {{Stream Cube}: An Architecture for Multi-Dimensional Analysis of Data Streams},
  journal   = {Distributed and Parallel Databases},
  volume    = {18},
  number    = {2},
  pages     = {173--197},
  year      = {2005},
  publisher = {Springer},
}

@inproceedings{LemireCASCON2002,
  author       = {Daniel Lemire},
  title        = {Wavelet-Based Relative Prefix Sum Methods for Range Sum Queries in Data Cubes},
  booktitle    = {Proceedings of CASCON 2002},
  organization = {IBM},
  month        = oct,
  year         = {2002},
}

@inproceedings{LemireDOLAP2003,
  author       = {Owen Kaser and Daniel Lemire},
  title        = {Attribute Value Reordering for Efficient Hybrid {OLAP}},
  booktitle    = {Proceedings of DOLAP'03},
  organization = {ACM},
  month        = nov,
  year         = {2003},
}

@inproceedings{propolyne,
  author    = {R. R. Schmidt and C. Shahabi},
  title     = {{ProPolyne}: A Fast Wavelet-based Algorithm for Progressive Evaluation of Polynomial Range-Sum Queries},
  booktitle = {Conference on Extending Database Technology},
  country   = {Prague},
  pages     = {664--681},
  month     = mar,
  year      = {2002},
}

@inproceedings{sdm05,
  author    = {Jian Pei and Moonjung Cho and David Cheung},
  title     = {Cross Table Cubing: Mining Iceberg Cubes from Data Warehouses},
  booktitle = {SDM'05},
  pages     = {461--465},
  year      = {2005},
  url       = {http://www.csis.hku.hk/~dcheung/publication/sdm05.pdf},
}
@inproceedings{netfli,
  author    = "Fusco, F. and Stoecklin, M. P. and Vlachos, M.",
  title     = "{NET-FLi}: On-the-fly Compression, Archiving and
               Indexing of Streaming Network Traffic",
  booktitle = "VLDB'10",
  year      = 2010,
  publisher = "VLDB Endowment",
  address   = "San Jose, CA, USA"
}


@inproceedings{DBLP:conf/vldb/XinHLW03,
  author    = {Dong Xin and
               Jiawei Han and
               Xiaolei Li and
               Benjamin W. Wah},
  title     = {Star-Cubing: Computing Iceberg Cubes by Top-Down and Bottom-Up
               Integration},
  booktitle = {VLDB'03},
  pages     = {476--487},
  year      = {2003},
  publisher = {VLDB Endowment},
  ee        = {http://www.vldb.org/conf/2003/papers/S15P02.pdf},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{992883,
  author    = {Seok-Ju Chun and Chin-Wan Chung and Seok-Lyong Lee},
  title     = {Space-efficient cubes for {OLAP} range-sum queries},
  journal   = {Decision Support Systems},
  volume    = {37},
  number    = {1},
  pages     = {83--102},
  year      = {2004},
  publisher = {Elsevier Science Publishers B. V.},
  address   = {Amsterdam, The Netherlands},
  issn      = {0167-9236},
  doi       = {10.1016/S0167-9236(03)00003-4},
  url       = {http://www.sm.luth.se/csee/csn/publications/Space-Efficient_Range-Sum_Queries_in_OLAP.pdf},
  topic     = {OLAP},
  subtopic  = {Query evaluation - Range Queries}
}

@article{shahabi05,
  author   = {Cyrus Shahabi and Mehrdad Jahangiri and Dimitris
              Sacharidis},
  title    = {Hybrid Query and Data Ordering for Fast and
              Progressive Range-Aggregate Query Answering},
  journal  = {International Journal of Data Warehousing and
              Mining},
  volume   = {1},
  number   = {2},
  month    = apr,
  year     = {2005},
  url      = {http://www.igi-online.com/downloads/pdf/ITJ2783_h8AQIgOg5Y.pdf},
  topic    = {OLAP},
  subtopic = {Query evaluation - Range Queries}
}

@article{Poon296,
  author   = {C. K. Poon},
  title    = {Dynamic Orthogonal Range Queries in {OLAP}},
  journal  = {Theoretical Computer Science},
  volume   = {296},
  number   = {3},
  pages    = {487--510},
  year     = {2003},
  url      = {http://www.cs.cityu.edu.hk/%7Eckpoon/research/olap1full.ps},
  topic    = {OLAP},
  subtopic = {Query evaluation - Range Queries}
}

@inproceedings{PoonICDT2003,
  author    = {C. K. Poon},
  title     = {Optimal Range Max Datacube for Fixed Dimensions},
  booktitle = {ICDT},
  pages     = {158--172},
  year      = {2003},
  url       = {http://www.cs.cityu.edu.hk/%7Eckpoon/research/olap2.ps},
  topic     = {OLAP},
  subtopic  = {Query evaluation - Range Queries}
}

@inproceedings{vitter99:approximate,
  author    = {Jeffrey Scott Vitter and Min Wang},
  title     = {Approximate computation of multidimensional
               aggregates of sparse data using wavelets},
  booktitle = {ACM SIGMOD},
  pages     = {193--204},
  year      = {1999},
  url       = {http://citeseer.ist.psu.edu/vitter99approximate.html},
  topic     = {OLAP},
  subtopic  = {Query evaluation - Range Queries}
}

@article{Kaser2004,
  author  = {Owen Kaser},
  title   = {Compressing arrays by ordering attribute values},
  journal = {Information Processing Letters},
  volume  = 92,
  number  = 5,
  pages   = {253--256},
  month   = dec,
  year    = 2004
}

@inproceedings{agrawal94fast,
  author        = {Rakesh Agrawal and Ramakrishnan Srikant},
  title         = {Fast Algorithms for Mining Association Rules},
  booktitle     = {VLDB'94},
  editor        = {Jorge B. Bocca and Matthias Jarke and Carlo Zaniolo},
  pages         = {487--499},
  month         = sep,
  year          = {1994},
  publisher     = {Morgan Kaufmann},
  isbn          = {1-55860-153-8},
  url           = {http://citeseer.ist.psu.edu/agrawal94fast.html},
  reviewcomment = {month was the truncated export "12--15~" (days only);
                   VLDB'94 took place 12--15 September 1994 -- verify}
}

@article{mafia05,
  author        = {Doug Burdick and Manuel Calimlim and Jason Flannick
                   and Johannes Gehrke and Tomi Yiu},
  title         = {{MAFIA}: A Maximal Frequent Itemset Algorithm},
  journal       = {IEEE Transactions on Knowledge and Data Engineering},
  volume        = {17},
  number        = {11},
  pages         = {1490--1504},
  month         = nov,
  year          = {2005},
  reviewcomment = {year was 2001 (the date of the earlier conference
                   version); TKDE volume 17 number 11 is November 2005
                   -- verify against the publisher record}
}

@article{tweed,
  author        = {Engene, Jan Oskar},
  title         = {Five Decades of Terrorism in {Europe}: The {TWEED} Dataset},
  journal       = {Journal of Peace Research},
  volume        = {44},
  number        = {1},
  pages         = {109--121},
  year          = {2007},
  isbn          = {82-92770-00-3},
  reviewcomment = {given name corrected from "Oaskar" to "Oskar" --
                   verify against the journal record}
}

@article{Korukonda06,
  author  = {A. R. Korukonda},
  title   = {Technique without theory or theory from technique?
             An examination of practical, philosophical and
             foundational issues in data mining},
  journal = {AI and Society The Journal of Human-Centred Systems},
  month   = aug,
  year    = {2006}
}

@misc{Lowell03,
  author        = {{Various authors}},
  title         = {The {Lowell} Database Research Self Assessment},
  month         = may,
  year          = {2003},
  publisher     = {Lowell, Massachusetts USA},
  url           = {http://research.microsoft.com/~Gray/lowell},
  reviewcomment = {typed as misc because there is no journal field;
                   the author is double-braced so it is not parsed as a
                   first/last personal name}
}

@article{lowell2005,
  author  = {Abiteboul, S. and others},
  title   = {The {Lowell} database research self-assessment},
  journal = {Communications of the ACM},
  volume  = {48},
  number  = {5},
  pages   = {111--118},
  year    = 2005
}

@article{szalay2006cse,
  author  = {Szalay, A. and Gray, J.},
  title   = {{2020 Computing}: Science in an exponential world},
  journal = {Nature},
  volume  = {440},
  pages   = {413--414},
  year    = 2006
}

@phdthesis{goil:thesis,
  author = {Sanjay Goil},
  title  = {High Performance On-line Analytical Processing and
            Data Mining on Parallel Computers},
  school = {Dept. ECE, Northwestern University},
  year   = 1999
}

@inproceedings{Techapichetvanich2005,
  author    = {Kesaraporn Techapichetvanich and Amitava Datta},
  title     = {Interactive Visualization for {OLAP}},
  booktitle = {ICCSA '05},
  pages     = {206--214},
  year      = {2005}
}

@inproceedings{956063,
  author    = {Andreas S. Maniatis and Panos Vassiliadis and Spiros
               Skiadopoulos and Yannis Vassiliou},
  title     = {Advanced visualization for {OLAP}},
  booktitle = {DOLAP '03},
  pages     = {9--16},
  year      = {2003},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {New Orleans, Louisiana, USA},
  isbn      = {1-58113-727-3},
  doi       = {10.1145/956060.956063}
}

@article{maniatis2005pmn,
  author  = {Maniatis, A. and Vassiliadis, P. and Skiadopoulos,
             S. and Vassiliou, Y. and Mavrogonatos, G. and
             Michalarias, I.},
  title   = {A Presentation Model \& Non-Traditional
             Visualization for {OLAP}},
  journal = {International Journal of Data Warehousing and
             Mining},
  volume  = {1},
  pages   = {1--36},
  year    = 2005
}

@article{Hartigan72,
  author               = {Hartigan, J. A.},
  title                = {Direct clustering of a data matrix},
  journal              = {Journal of the American Statistical Association},
  volume               = {67},
  number               = {337},
  pages                = {123--129},
  year                 = 1972,
  keywords             = {clustering},
  priority             = {2},
  citeulike-article-id = {635756}
}

@misc{Keesings,
  title = {Keesing's Worldwide Online},
  note  = {Last checked 07-29-2009},
  url   = {http://www.keesings.com}
}

@article{Pearson06,
  author  = {Pearson, R. K.},
  title   = {The Problem of Disguised Missing Data},
  journal = {SIGKDD Explorations},
  volume  = {8},
  number  = {1},
  pages   = {83--92},
  month   = jun,
  year    = {2006}
}

@book{Cheney,
  author    = {Ward Cheney and David Kincaid},
  title     = {Numerical Mathematics and Computing},
  edition   = {3rd},
  publisher = {Brooks Cole Publishing},
  year      = {1998},
  isbn      = {0-534-50019-6}
}

@article{Time2003,
  key     = {Time},
  title   = {Numbers},
  journal = {Time Magazine},
  month   = apr # "~28",
  year    = {2003}
}

@article{253288,
  author    = {Yihong Zhao and Prasad M. Deshpande and Jeffrey
               F. Naughton},
  title     = {An array-based algorithm for simultaneous
               multidimensional aggregates},
  journal   = {SIGMOD Rec.},
  volume    = {26},
  number    = {2},
  pages     = {159--170},
  year      = {1997},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  issn      = {0163-5808},
  doi       = {10.1145/253262.253288}
}

@inproceedings{conf/mldm/KayaA03,
  author    = {Mehmet Kaya and Reda Alhajj},
  title     = {Integrating Fuzziness with {OLAP} Association Rules
               Mining},
  booktitle = {MLDM 2003},
  editor    = {Petra Perner and Azriel Rosenfeld},
  series    = {Lecture Notes in Computer Science},
  volume    = {2734},
  pages     = {353--368},
  year      = {2003},
  publisher = {Springer},
  isbn      = {3-540-40504-6},
  url       = {http://link.springer.de/link/service/series/0558/bibs/2734/27340353.htm},
  bibdate   = {2003-06-26},
  bibsource = {DBLP,
               http://dblp.uni-trier.de/db/conf/mldm/mldm2003.html#KayaA03}
}

@inproceedings{ncstrl.ustuttgart_fi//INPROC-2005-17,
  author        = {Rodrigo Salvador Monteiro and Geraldo Zimbrao and
                   Holger Schwarz and Bernhard Mitschang and Jano
                   Moreira De Souza},
  title         = {Building the Data Warehouse of Frequent Itemsets in
                   the {DWFIST} Approach},
  booktitle     = {Proceedings of the 15th International Symposium on
                   Methodologies for Intelligent Systems, Saratoga
                   Springs, New York, May 25--28, 2005},
  pages         = {1--9},
  month         = may,
  year          = {2005},
  publisher     = {Springer},
  isbn          = {3-540-25878-7},
  language      = {English},
  type          = {Article in Proceedings},
  institution   = {Universit{\"a}t Stuttgart, Fakult{\"a}t Informatik,
                   Elektrotechnik und Informationstechnik, Germany},
  cr-category   = {H.2.7 Database Administration;
                   H.2.8 Database Applications},
  ncstrl-series = {Artikel in Tagungsband},
  notes         = {; citation: Building the Data Warehouse of Frequent
                   Itemsets in the DWFIST Approach. In: Proceedings of
                   the 15th International Symposium on Methodologies
                   for Intelligent Systems Saratoga Springs, New York -
                   May 25-28, 2005},
  bibdate       = {February 24, 2005},
  reviewcomment = {the exported series value was a catalogue label, not
                   a book series, so it is kept under ncstrl-series;
                   the two cr-category fields were merged into one}
}

@article{304214,
  author    = {Kevin Beyer and Raghu Ramakrishnan},
  title     = {Bottom-up computation of sparse and {Iceberg} {CUBE}},
  journal   = {SIGMOD Rec.},
  volume    = {28},
  number    = {2},
  pages     = {359--370},
  year      = {1999},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  issn      = {0163-5808},
  doi       = {10.1145/304181.304214}
}

@inproceedings{bhuvanagiri2006sae,
  author    = {Bhuvanagiri, L. and Ganguly, S. and Kesh, D. and
               Saha, C.},
  title     = {Simpler Algorithm for Estimating Frequency Moments
               of Data Streams},
  booktitle = {SODA'06},
  pages     = {708--713},
  year      = {2006},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{indyk2005oaf,
  author    = {Indyk, P. and Woodruff, D.},
  title     = {Optimal Approximations of the Frequency Moments of
               Data Streams},
  booktitle = {Proceedings of the thirty-seventh annual ACM
               symposium on Theory of computing},
  pages     = {202--208},
  year      = {2005},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{schmidt1993chb,
  author    = {Schmidt, J. P. and Siegel, A. and Srinivasan, A.},
  title     = {{Chernoff-Hoeffding} Bounds for Applications with
               Limited Independence},
  booktitle = {SODA'93},
  pages     = {331--340},
  year      = 1993
}

@comment{%publisher={Society for Industrial and Applied Mathematics Philadelphia, PA, USA}}
@book{folland1984ram,
  author    = "Folland, G. B.",
  title     = "Real Analysis: Modern Techniques and Their
               Applications",
  publisher = "Wiley",
  year      = 1984,
  pages     = "368"
}

@misc{bour:uniformRNGpage,
  author       = {Paul Bourke},
  title        = {Uniform Random Number Generator},
  howpublished = {online:
                  \url{http://astronomy.swin.edu.au/~pbourke/other/random/index.html}},
  month        = mar,
  year         = 1998,
  note         = {checked 2007-05-30}
}

@misc{oracle9_compress,
  author       = {Meikel Poess and Hermann Baer},
  title        = {Decision Speed: Table Compression In Action},
  howpublished = {online:
                  \url{http://www.oracle.com/technology/oramag/webcolumns/2003/techarticles/poess_tablecomp.html}},
  year         = 2003
}

@misc{lewisdbazine,
  author       = {Jonathan Lewis},
  title        = {Understanding Bitmap Indexes},
  howpublished = {online:
                  \url{http://www.dbazine.com/oracle/or-articles/jlewis3}},
  year         = 2006
}

@misc{oraclevivekbitmap---fr,
  author       = {Vivek Sharma},
  title        = {Bitmap Index vs. B-tree Index: Which and When?},
  howpublished = {En ligne~:
                  \url{http://www.oracle.com/technology/pub/articles/sharma_indexes.html}},
  day          = 11,
  month        = {mars},
  year         = 2005,
  note         = {Dernier acc\`es le 22 avril 2008.}
}

@misc{oraclevivekbitmap,
  author       = {Vivek Sharma},
  title        = {Bitmap Index vs. B-tree Index: Which and When?},
  howpublished = {online:
                  \url{http://www.oracle.com/technology/pub/articles/sharma_indexes.html}},
  day          = 11,
  month        = mar,
  year         = 2005
}

@misc{haah:randomorg,
  author       = {Mads Haahr},
  title        = {{random.org} --- True Random Number Service},
  howpublished = {online, \url{http://www.random.org}},
  month        = oct,
  year         = 1998,
  note         = {checked 2007-05-30}
}

@article{james:pseudorandom-review,
  author  = {F. James},
  title   = {A Review of Pseudorandom Number Generators},
  journal = {Computer Physics Communications},
  volume  = 60,
  pages   = {329--344},
  year    = 1990
}

@techreport{Christofides1976,
  author      = {N. Christofides},
  title       = {Worst-case analysis of a new heuristic for the
                 travelling salesman problem},
  institution = {Graduate School of Industrial Administration,
                 Carnegie Mellon University},
  number      = 388,
  year        = 1976
}

@techreport{mars:rng-tr,
  author      = {George Marsaglia and Arif Zaman},
  title       = {Toward a Universal Random Number Generator},
  institution = {Florida State University},
  number      = {FSU-SCRI-87-50},
  year        = 1987
}

@article{matsumoto1998mtd,
  author  = {Matsumoto, M. and Nishimura, T.},
  title   = {{Mersenne Twister}: A 623-Dimensionally
             Equidistributed Uniform Pseudo-Random Number
             Generator},
  journal = {ACM Transactions on Modeling and Computer
             Simulation},
  volume  = {8},
  number  = {1},
  pages   = {3--30},
  year    = 1998
}

@misc{unicode5,
  author       = {{The Unicode Consortium}},
  title        = {Unicode Home Page},
  howpublished = {\url{http://unicode.org/}},
  year         = 2006,
  note         = {checked 2007-05-30}
}

@misc{GutenbergDVD,
  author       = {{Project Gutenberg Literary Archive Foundation}},
  title        = {July 2006 {Gutenberg} {DVD}},
  howpublished = {\url{http://www.gutenberg.org/wiki/Gutenberg:The_CD_and_DVD_Project}},
  year         = 2006,
  note         = {(Last checked 07-29-2009)}
}

@misc{GutenbergDVDs,
  author       = {{Project Gutenberg Literary Archive Foundation}},
  title        = {The {CD} and {DVD} Project},
  howpublished = {\url{http://www.gutenberg.org/wiki/Gutenberg:The_CD_and_DVD_Project}},
  year         = 2006,
  note         = {checked 2007-03-16}
}

@misc{GutenbergDVD2003,
  author       = {{Project Gutenberg Literary Archive Foundation}},
  title        = {December 2003 {Gutenberg} {DVD}},
  howpublished = {\url{http://www.gutenberg.org/wiki/Gutenberg:The_CD_and_DVD_Project}},
  year         = 2006,
  note         = {checked 2007-01-12}
}


@misc{GutenbergCanada-url,
  title        = {Project {Gutenberg} Canada},
  howpublished = {\url{http://www.gutenberg.ca/}~(checked 06-07-2011)},
  year         = 2007
}


@misc{GutenbergHeaderFooter,
  author       = {{Project Gutenberg Literary Archive Foundation}},
  title        = {Project {Gutenberg} Header How To},
  howpublished = {\url{http://www.gutenberg.org/wiki/Gutenberg:Project_Gutenberg_Header_How-To}},
  year         = 2006,
  note         = {checked 2006-10-17}
}

@misc{GutenbergMirror,
  author       = {{Project Gutenberg Literary Archive Foundation}},
  title        = {{Gutenberg}: Mirroring How-To},
  howpublished = {\url{http://www.gutenberg.org/wiki/Gutenberg:Mirroring_How-To}},
  year         = 2006,
  note         = {checked 2007-01-17}
}

@misc{GutenMark,
  author       = {Ronald S. Burkey},
  title        = {{GutenMark} Download Page},
  howpublished = {online:
                  \url{http://www.sandroid.org/GutenMark/download.html}},
  year         = 2005,
  note         = {last checked 18-01-2007}
}

@article{carter1979uch,
  author  = {Carter, L. and Wegman, M. N.},
  title   = {Universal Classes of Hash Functions},
  journal = {Journal of Computer and System Sciences},
  volume  = {18},
  number  = {2},
  pages   = {143--154},
  year    = 1979
}

@inproceedings{Guha2006,
  author    = {Sudipto Guha and Andrew McGregor and Suresh
               Venkatasubramanian},
  title     = {Streaming and sublinear approximation of entropy and
               information distances},
  booktitle = {SODA'06},
  pages     = {733--742},
  year      = {2006},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {Miami, Florida},
  isbn      = {0-89871-605-5},
  doi       = {10.1145/1109557.1109637}
}

@inproceedings{Chakrabarti2006,
  author    = {Amit Chakrabarti and Khanh Do Ba and
               S. Muthukrishnan},
  title     = {Estimating Entropy and Entropy Norm on Data Streams},
  booktitle = {STACS 2006},
  year      = 2006
}

@inproceedings{Kearns1994,
  author    = {Michael Kearns and Yishay Mansour and Dana Ron and
               Ronitt Rubinfeld and Robert E. Schapire and Linda
               Sellie},
  title     = {On the learnability of discrete distributions},
  booktitle = {STOC'94},
  pages     = {273--282},
  year      = {1994},
  isbn      = {0-89791-663-8},
  doi       = {10.1145/195058.195155}
}

@inproceedings{Orlitsky2003,
  author    = {Orlitsky, A. and Santhanam, N. P. and Zhang, J.},
  title     = {{Always Good Turing}: asymptotically optimal
               probability estimation},
  booktitle = {FOCS'03},
  pages     = {179--188},
  year      = 2003
}

@inproceedings{755182,
  author    = {David A. McAllester and Robert E. Schapire},
  title     = {On the Convergence Rate of {Good-Turing} Estimators},
  booktitle = {COLT'00: Proceedings of the Thirteenth Annual
               Conference on Computational Learning Theory},
  pages     = {1--6},
  year      = {2000},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
  isbn      = {1-55860-703-X}
}

@inproceedings{Gibbons2001,
  author    = {Phillip B. Gibbons and Srikanta Tirthapura},
  title     = {Estimating simple functions on the union of data
               streams},
  booktitle = {SPAA'01},
  pages     = {281--291},
  year      = {2001},
  isbn      = {1-58113-409-6}
}

@inproceedings{Batu2002,
  author    = {Tugkan Batu and Sanjoy Dasgupta and Ravi Kumar and
               Ronitt Rubinfeld},
  title     = {The complexity of approximating entropy},
  booktitle = {STOC'02},
  pages     = {678--687},
  year      = {2002},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {Montreal, Quebec, Canada},
  isbn      = {1-58113-495-9},
  doi       = {10.1145/509907.510005}
}

@article{nadeau2003pmo,
  author    = {Nadeau, T. P. E. and Teorey, T. J. E.},
  title     = {A {Pareto} Model for {OLAP} View Size Estimation},
  journal   = {Information Systems Frontiers},
  volume    = {5},
  number    = {2},
  pages     = {137--147},
  year      = {2003},
  publisher = {Springer}
}

@inbook{Kotidis2002,
  author    = {Yannis Kotidis},
  title     = {Handbook of Massive Data Sets},
  chapter   = {Aggregate View Management in Data Warehouses},
  pages     = {711--741},
  publisher = {Kluwer Academic Publishers},
  address   = {Norwell, MA, USA},
  year      = {2002},
  isbn      = {1-4020-0489-3}
}

@inbook{Johnson2002-dw,
  author    = {Theodore Johnson},
  title     = {Handbook of Massive Data Sets},
  chapter   = {Data Warehousing},
  pages     = {661--710},
  publisher = {Kluwer Academic Publishers},
  address   = {Norwell, MA, USA},
  year      = {2002},
  isbn      = {1-4020-0489-3}
}

@inproceedings{haas1995sbe,
  author    = {Haas, P. J. and Naughton, J. F. and Seshadri, S. and
               Stokes, L.},
  title     = {Sampling-Based Estimation of the Number of Distinct
               Values of an Attribute},
  booktitle = {VLDB'95},
  pages     = {311--322},
  year      = 1995
}

@inproceedings{faloutsos1996msd,
  author    = {Faloutsos, C. and Matias, Y. and Silberschatz, A.},
  title     = {Modeling Skewed Distribution Using Multifractals and
               the 80-20 Law},
  booktitle = {VLDB'96},
  pages     = {307--317},
  year      = 1996
}

@phdthesis{Olken1993,
  author = {F. Olken},
  title  = {Random sampling from databases},
  school = {UC Berkeley},
  year   = 1993
}

@inproceedings{iceberg98,
  author    = {Min Fang and Narayanan Shivakumar and Hector
               Garcia-Molina and Rajeev Motwani and Jeffrey
               D. Ullman},
  title     = {Computing Iceberg Queries Efficiently},
  booktitle = {VLDB'98},
  pages     = {299--310},
  year      = {1998},
  isbn      = {1-55860-566-5}
}

@comment{
     %publisher ="Morgan Kaufmann Publishers Inc.",
 %address ="San Francisco, CA, USA",
    }
@inproceedings{shukla:sem,
  author    = {Shukla, A. and Deshpande, P. and Naughton, J. F. and
               Ramasamy, K.},
  title     = {Storage Estimation for Multidimensional Aggregates
               in the Presence of Hierarchies},
  booktitle = {VLDB'96},
  pages     = {522--531},
  year      = 1996
}

@inproceedings{doraisamy2003pia,
  author    = {Doraisamy, S. and R{\"u}ger, S.},
  title     = {Position Indexing of Adjacent and Concurrent N-Grams
               for Polyphonic Music Retrieval},
  booktitle = {ISMIR 2003},
  pages     = {227--228},
  year      = 2003
}

@article{flajolet1985pca,
  author    = {Flajolet, P. and Martin, G. N.},
  title     = {Probabilistic Counting Algorithms for Data Base
               Applications},
  journal   = {Journal of Computer and System Sciences},
  volume    = {31},
  number    = {2},
  pages     = {182--209},
  year      = {1985},
  publisher = {Academic Press, Inc. Orlando, FL, USA}
}

@inproceedings{1073465,
  author    = {Chin-Yew Lin and Eduard Hovy},
  title     = {Automatic evaluation of summaries using N-gram
               co-occurrence statistics},
  booktitle = {NAACL'03},
  pages     = {71--78},
  year      = {2003},
  publisher = {Association for Computational Linguistics},
  address   = {Morristown, NJ, USA},
  location  = {Edmonton, Canada}
}

@inproceedings{droettboom2003cbc,
  author    = {Droettboom, M.},
  title     = {Correcting Broken Characters in the Recognition of
               Historical Printed Documents},
  booktitle = {Digital Libraries 2003},
  pages     = {364--366},
  year      = 2003
}

@inproceedings{shah2004sem,
  author    = {Shah, B. and Ramachandran, K. and Raghavan, V.},
  title     = {Storage Estimation of Multidimensional Aggregates in
               a Data Warehouse Environment},
  booktitle = {Proceedings of the World Multi-Conference on
               Systemics, Cybernetics and Informatics},
  year      = 2004
}

@article{ciaccia2003bca,
  author    = {Ciaccia, P. and Golfarelli, M. and Rizzi, S.},
  title     = {Bounding the cardinality of aggregate views through
               domain-derived constraints},
  journal   = {Data \& Knowledge Engineering},
  volume    = {45},
  number    = {2},
  pages     = {131--153},
  year      = {2003},
  publisher = "Elsevier Science Publishers BV Amsterdam, The
               Netherlands, The Netherlands"
}

@inproceedings{ciaccia2001eca,
  author        = {Paolo Ciaccia and Matteo Golfarelli and Stefano
                   Rizzi},
  title         = {On Estimating the Cardinality of Aggregate Views},
  booktitle     = {DMDW},
  pages         = {12.1--12.10},
  pagescomments = {page numbers are odd, but it seems correct},
  year          = {2001},
  ee            = {http://sunsite.informatik.rwth-aachen.de/Publications/CEUR-WS/Vol-39/paper12.pdf},
  bibsource     = "DBLP, http://dblp.uni-trier.de"
}

@inproceedings{cohen2002usc,
  author    = {Cohen, P. and Heeringa, B. and Adams, N.},
  title     = {Unsupervised Segmentation of Categorical Time Series
               into Episodes},
  booktitle = {ICDM'02},
  pages     = {99--106},
  year      = 2002
}

@article{deshpande2004smm,
  author    = {Deshpande, M. and Karypis, G.},
  title     = {Selective {Markov} models for predicting {Web} page
               accesses},
  journal   = {ACM Transactions on Internet Technology (TOIT)},
  volume    = {4},
  number    = {2},
  pages     = {163--184},
  year      = {2004},
  publisher = "ACM Press New York, NY, USA"
}

@inproceedings{jagadeesh2005dma,
  author    = {R. P. Jagadeesh Chandra Bose and S. H. Srinivasan},
  title     = {Data Mining Approaches to Software Fault Diagnosis},
  booktitle = {RIDE '05},
  pages     = {45--52},
  year      = {2005},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  isbn      = {0-7695-2390-0},
  doi       = {10.1109/RIDE.2005.9}
}

@inbook{caropreso2001lie,
  author    = {Maria Fernanda Caropreso and Stan Matwin and
               Fabrizio Sebastiani},
  title     = {Text Databases \& Document Management: Theory \&
               Practice},
  chapter   = {A Learner-Independent Evaluation of the Usefulness
               of Statistical Phrases for Automated Text
               Categorization},
  pages     = {78--102},
  publisher = {Idea Group Publishing},
  address   = {Hershey, PA, USA},
  year      = {2001},
  isbn      = {1-878289-93-4}
}

@inproceedings{YuZuzarteSevcik,
  author    = {Xiaohui Yu and Calisto Zuzarte and Kenneth
               C. Sevcik},
  title     = {Towards estimating the number of distinct value
               combinations for a set of attributes},
  booktitle = {CIKM'05},
  pages     = {656--663},
  year      = {2005},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {Bremen, Germany},
  isbn      = {1-59593-140-6},
  doi       = {10.1145/1099554.1099719}
}

@inproceedings{BarYossef2002,
  author    = {Ziv Bar-Yossef and T. S. Jayram and Ravi Kumar and
               D. Sivakumar and Luca Trevisan},
  title     = {Counting Distinct Elements in a Data Stream},
  booktitle = {RANDOM'02},
  pages     = {1--10},
  year      = {2002},
  isbn      = {3-540-44147-6},
  ignoreurl = "http://www.almaden.ibm.com/cs/people/siva/papers/f0.ps"
}

@inproceedings{780593,
  author    = {Ziv Bar-Yossef},
  title     = {Sampling lower bounds via information theory},
  booktitle = {STOC'03},
  pages     = {335--344},
  year      = {2003},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {San Diego, CA, USA},
  isbn      = {1-58113-674-9},
  doi       = {10.1145/780542.780593}
}

@inproceedings{BarYossef2001,
  author    = {Ziv Bar-Yossef and Ravi Kumar and D. Sivakumar},
  title     = {Sampling algorithms: lower bounds and applications},
  booktitle = {STOC'01},
  pages     = {266--275},
  year      = {2001},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  location  = {Hersonissos, Greece},
  isbn      = {1-58113-349-9},
  doi       = {10.1145/380752.380810}
}

@inproceedings{NagaoMori,
  author    = {Makoto Nagao and Shinsuke Mori},
  title     = {A new method of N-gram statistics for large number
               of n and automatic extraction of words and phrases
               from large text data of {Japanese}},
  booktitle = {COLING'94},
  pages     = "611--615",
  year      = {1994}
}

@article{gonnet1990akr,
  author    = {Gonnet, G. H. and Baeza-Yates, R. A.},
  title     = {An analysis of the {Karp-Rabin} string matching
               algorithm},
  journal   = {Information Processing Letters},
  volume    = {34},
  number    = {5},
  pages     = {271--274},
  year      = {1990},
  publisher = "Elsevier North-Holland, Inc. Amsterdam, The
               Netherlands, The Netherlands"
}

@article{karp1987erp,
  author    = {Karp, R. M. and Rabin, M. O.},
  title     = {Efficient randomized pattern-matching algorithms},
  journal   = {IBM Journal of Research and Development},
  volume    = {31},
  number    = {2},
  pages     = {249--260},
  year      = {1987},
  publisher = "IBM Corp. Riverton, NJ, USA"
}

@comment{Unicode Character Standard version 3.2}
@article{cohenhash,
  author    = {Jonathan D. Cohen},
  title     = {Recursive hashing functions for n-grams},
  journal   = {ACM Trans. Inf. Syst.},
  volume    = {15},
  number    = {3},
  pages     = {291--320},
  year      = {1997},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{GaoZhang,
  author        = {Jianfeng Gao and Min Zhang},
  title         = {Improving language model size reduction using better
                   pruning criteria},
  booktitle     = {ACL'02: Proceedings of the 40th Annual Meeting on
                   Association for Computational Linguistics},
  pages         = {176--182},
  year          = {2002},
  publisher     = {Association for Computational Linguistics},
  address       = {Morristown, NJ, USA},
  location      = {Philadelphia, Pennsylvania},
  reviewcomment = {year was 2001 in the export, which contradicts the
                   ACL'02 booktitle; set to 2002 -- verify}
}

@inproceedings{KimWhang,
  author    = {Min-Soo Kim and Kyu-Young Whang and Jae-Gil Lee and Min-Jae Lee},
  title     = {n-gram/2L: a space and time efficient two-level n-gram inverted index structure},
  booktitle = {VLDB'05},
  year      = {2005},
  pages     = {325--336},
  isbn      = {1-59593-154-6},
  location  = {Trondheim, Norway},
  publisher = {VLDB Endowment},
}

@article{Yannakoudakis1990,
  author =       "E. J. Yannakoudakis and I. Tsomokos and
                  P. J. Hutton",
  owenscomment = "ACM transposed letters in Tsomokos' name",
  title =        "{n-Grams} and their implication to natural language
                  understanding",
  journal =      "Pattern Recogn.",
  volume =       "23",
  number =       "5",
  year =         "1990",
  issn =         "0031-3203",
  pages =        "509--528",
  doi =          "http://dx.doi.org/10.1016/0031-3203(90)90072-S",
  publisher =    "Elsevier Science Inc.",
  address =      "New York, NY, USA",
}

@article{3165,
  author =       "Jeffrey S. Vitter",
  title =        "Random sampling with a reservoir",
  journal =      "ACM Trans. Math. Softw.",
  volume =       "11",
  number =       "1",
  year =         "1985",
  issn =         "0098-3500",
  pages =        "37--57",
  doi =          "http://doi.acm.org/10.1145/3147.3165",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@inproceedings{kit1998vca,
  author    = {Kit, C. and Wilks, Y.},
  title     = {The {Virtual Corpus} approach to deriving n-gram statistics from large scale corpora},
  booktitle = {Proceedings of 1998 International Conference on Chinese Information Processing},
  year      = {1998},
  pages     = {223--229},
}

@article{Kolonko2006SRS,
  author =       {M. Kolonko and D. W{\"a}sch},
  title =        "Sequential reservoir sampling with a nonuniform
                  distribution",
  journal =      "ACM Trans. Math. Softw.",
  volume =       "32",
  number =       "2",
  year =         "2006",
  issn =         "0098-3500",
  pages =        "257--273",
  doi =          "http://doi.acm.org/10.1145/1141885.1141891",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}
@Book{KnuthV1E3,
  author =       "Donald E. Knuth",
  title =        "Fundamental Algorithms",
  volume =       1,
  series =       "The Art of Computer Programming",
  edition =      "Third",
  publisher =    "Addison-Wesley",
  year =         {1997}
}

@Book{Knuth1969,
  author =       "Donald E. Knuth",
  title =        "Seminumerical Algorithms",
  volume =       2,
  series =       "The Art of Computer Programming",
  publisher =    "Addison-Wesley",
  year =         {1969}
}

@Book{KnuthV3E3,
  author =       "Donald E. Knuth",
  title =        "Sorting and Searching",
  volume =       3,
  series =       "The Art of Computer Programming",
  publisher =    "Addison-Wesley",
  year =         {1997}
}

@article{198435,
  author =       "Kim-Hung Li",
  title =        "Reservoir-sampling algorithms of time complexity
                  {O(n(1 + log(N/n)))}",
  journal =      "ACM Trans. Math. Softw.",
  volume =       "20",
  number =       "4",
  year =         "1994",
  issn =         "0098-3500",
  pages =        "481--493",
  doi =          "http://doi.acm.org/10.1145/198429.198435",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@inproceedings{Su2000,
  author    = {Su, Z. and Yang, Q. and Lu, Y. and Zhang, H.},
  title     = {{WhatNext}: a prediction system for {Web} requests using n-gram sequence models},
  booktitle = {Web Information Systems Engineering 2000},
  year      = {2000},
  pages     = {214--221}
}

@Misc{jfccs174,
  author =       "John Canny",
  title =        "{CS174} Lecture Notes",
  howpublished =
                  "\url{http://www.cs.berkeley.edu/~jfc/cs174/lecs/lec10/lec10.pdf}",
  year =         2002,
  note =         {checked 2007-05-30}
}

@Misc{COS,
  author =       "Frank Ruskey",
  title =        "The (Combinatorial) Object Server",
  howpublished = "\url{http://www.theory.cs.uvic.ca/~cos/cos.html}",
  year =         2006,
  note =         {checked 2010-06-03}
}

@TechReport{KeithKaserLemireTR05001,
  author =       "Steven Keith and Owen Kaser and Daniel Lemire",
  title =        "Analyzing Large Collections of Electronic Text Using
                  {OLAP}",
  institution =  "UNBSJ CSAS",
  year =         "2005",
  month =        jun,
  number =       {TR-05-001}
}

@inproceedings{KaserKeithLemire2006,
  author =       "Owen Kaser and Steven Keith and Daniel Lemire",
  title =        "The {LitOLAP} Project: Data Warehousing with
                  Literature",
  booktitle =    "CaSTA'06",
  year =         "2006",
  url =
                  {http://www.daniel-lemire.com/fr/documents/publications/casta06_web.pdf}
}

@inproceedings{siegel1989ucf,
  author    = {Siegel, A.},
  title     = {On universal classes of fast high performance hash functions, their time-space tradeoff, and their applications},
  booktitle = {FOCS'89},
  year      = {1989},
  pages     = {20--25}
}

@inproceedings{durand2003lcl,
  author    = {Durand, M. and Flajolet, P.},
  title     = {Loglog counting of large cardinalities},
  booktitle = {ESA'03},
  series    = {LNCS},
  volume    = {2832},
  pages     = {605--617},
  year      = {2003}
}

@inproceedings{KeithKaserLemireAPICS2005,
  author =       "Steven Keith and Owen Kaser and Daniel Lemire",
  title =        "Analyzing Large Collections of Electronic Text Using
                  {OLAP}",
  booktitle =    "APICS 2005",
  year =         "2005",
  month =        oct,
  location =     {Wolfville, Canada}
}

@Article{Shannon1948,
  author =       "Claude E. Shannon",
  title =        "A mathematical theory of communication",
  journal =      "Bell System Technical Journal",
  volume =       27,
  pages =        "379--423, 623--656",
  year =         {1948}
}

@article{Shannon1948reprint,
  author =       "C. E. Shannon",
  title =        "A mathematical theory of communication",
  journal =      "SIGMOBILE Mob. Comput. Commun. Rev.",
  volume =       "5",
  number =       "1",
  year =         "2001",
  issn =         "1559-1662",
  pages =        "3--55",
  doi =          "http://doi.acm.org/10.1145/584091.584093",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@article{Losiewicz2000,
  author =       "Paul Losiewicz and Douglas W. Oard and Ronald
                  N. Kostoff",
  title =        "Textual Data Mining to Support Science and
                  Technology Management",
  journal =      "J. Intell. Inf. Syst.",
  volume =       "15",
  number =       "2",
  year =         "2000",
  issn =         "0925-9902",
  pages =        "99--119",
  doi =          "http://dx.doi.org/10.1023/A:1008777222412",
  publisher =    "Kluwer Academic Publishers",
  address =      "Hingham, MA, USA",
}

@inproceedings{Paulus2003,
  title =        "Conventional and periodic n-grams in the
                  transcription of drum sequences",
  author =       "Paulus, J. K. and Klapuri, A. P.",
  booktitle =    "ICME'03",
  pages =        "737--740",
  year =         2003
}

@book{jelinek1998sms,
  title =        "Statistical methods for speech recognition",
  author =       "Jelinek, F.",
  year =         "1998",
  publisher =    "MIT Press",
  address =      {Cambridge, MA, USA}
}

@inproceedings{Nie2000,
  author =       "Jian-Yun Nie and Jianfeng Gao and Jian Zhang and
                  Ming Zhou",
  title =        "On the use of words and n-grams for {Chinese}
                  information retrieval",
  booktitle =    "IRAL'00: Proceedings of the Fifth International
                  Workshop on Information Retrieval with Asian
                  Languages",
  year =         "2000",
  isbn =         "1-58113-300-6",
  pages =        "141--148",
  location =     "Hong Kong, China",
  doi =          "http://doi.acm.org/10.1145/355214.355235",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@inproceedings{dementiev2005bem,
  title =        "Better External Memory Suffix Array Construction",
  author =       {Dementiev, R. and Mehnert, J. and K{\"a}rkk{\"a}inen, J. and
                  Sanders, P.},
  booktitle =    "ALENEX05: Workshop on Algorithm Engineering \&
                  Experiments",
  location =     "Vancouver",
  year =         2005
}

@inproceedings{HonSung,
  author    = {Hon, W. K. and Sadakane, K. and Sung, W. K.},
  title     = {Breaking a time-and-space barrier in constructing full-text indices},
  booktitle = {FOCS'03},
  year      = {2003},
  pages     = {251--260}
}

@article{whang1990ltp,
  title =        "A Linear-Time Probabilistic Counting Algorithm for
                  Database Applications",
  author =       "Whang, Kyu-Young and Vander-Zanden, B. T. and Taylor, H. M.",
  journal =      "ACM Transactions on Database Systems",
  volume =       "15",
  number =       "2",
  pages =        "208--229",
  year =         1990
}

@TechReport{idc2006,
  author =       "Dan Vesset and Brian McDonough",
  title =        "Analytics and Data Warehousing Software: Competitive
                  Analysis",
  institution =  "International Data Corporation (IDC)",
  year =         2006,
  number =       202603,
  month =        jul
}

@inproceedings{dean2004msd,
  author    = {Dean, J. and Ghemawat, S.},
  title     = {{MapReduce}: Simplified Data Processing on Large Clusters},
  booktitle = {OSDI 2004},
  year      = {2004}
}

@inproceedings{chan1998bid,
  author    = {Chan, C. Y. and Ioannidis, Y. E.},
  title     = {Bitmap index design and evaluation},
  booktitle = {SIGMOD'98},
  year      = {1998},
  pages     = {355--366}
}

@article{dehne2006cpo,
  title =        "The {cgmCUBE} project: Optimizing parallel data cube
                  generation for {ROLAP}",
  author =       "Dehne, Frank and Eavis, Todd and Rau-Chaplin, Andrew",
  journal =      "Distributed and Parallel Databases",
  volume =       "19",
  number =       "1",
  pages =        "29--62",
  year =         "2006",
  publisher =    {Springer}
}

@Misc{TelcorPatent,
  author =       "Francis L. Bacon and Donald J. Houde",
  title =        "Data Compression Apparatus and Method",
  howpublished = "US Patent 4612532",
  year =         1984,
  note =         {filed 1984; granted 1986. Assignee Telebyte (later
                  Telcor Systems)}
}

@Article{joul:llc-attribution06,
  author =       "Patrick Juola and John Sofko and Patrick Brennan",
  title =        "A Prototype for Authorship Attribution Studies",
  journal =      llc,
  year =         2006,
  volume =       21,
  number =       2,
  pages =        {169--178}
}

@InProceedings{kese:CNG-method-entry,
  author =       "V. Keselj and N. Cercone",
  title =        "{CNG} Method with Weighted Voting",
  booktitle =    "ad-hoc Authorship Attribution Contest",
  year =         2004,
  editor =       "P. Juola",
  organization = {AHC/ALLC}
}

@Book{weis:dsaaj,
  author =       "M. Weiss",
  title =        "Data Structures and Algorithm Analysis in Java",
  publisher =    "Addison Wesley",
  year =         1999
}

@Misc{j15doc:String,
  author =       "{Sun Microsystems}",
  title =        "{String (Java 2 Platform SE 5.0)}",
  howpublished = "online documentation:
                  \url{http://java.sun.com/j2se/1.5.0/docs/api/index.html}",
  year =         2004
}

@Misc{sary-home,
  author =       "Satoru Takabayashi",
  title =        "Sary: A Suffix Array Library and Tools",
  howpublished = "online: \url{http://sary.sourceforge.net/}",
  month =        mar,
  year =         2005,
  note =         {checked 2007-05-30}
}

@Misc{sufary-home,
  author =       "Tatsuo Yamashita",
  title =        "{SUFARY}",
  howpublished = "online: \url{http://nais.to/~yto/tools/sufary}",
  month =        jan,
  year =         2005,
  note =         {checked 2007-05-30}
}

@article{morenoifpl2005,
  author =       "Eduardo Moreno",
  title =        "{De Bruijn} Sequences and {De Bruijn} Graphs for a
                  General Language",
  journal =      "Information Processing Letters",
  volume =       "96",
  number =       "6",
  pages =        "214--219",
  year =         "2005"
}

@inproceedings{564415,
  author =       "Dirk Bahle and Hugh E. Williams and Justin Zobel",
  title =        "Efficient phrase querying with an auxiliary index",
  booktitle =    "SIGIR '02: Proceedings of the 25th annual
                  international ACM SIGIR conference on Research and
                  development in information retrieval",
  year =         "2002",
  isbn =         "1-58113-561-0",
  pages =        "215--221",
  location =     "Tampere, Finland",
  doi =          "http://doi.acm.org/10.1145/564376.564415",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}






@article{179818,
  author =       "Avrim Blum and Tao Jiang and Ming Li and John Tromp
                  and Mihalis Yannakakis",
  title =        "Linear approximation of shortest superstrings",
  journal =      "J. ACM",
  volume =       "41",
  number =       "4",
  year =         "1994",
  issn =         "0004-5411",
  pages =        "630--647",
  doi =          "http://doi.acm.org/10.1145/179812.179818",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@Article{Kaplan2005,
  author =       "Haim Kaplan and Nira Shafrir",
  title =        "The greedy algorithm for shortest superstrings",
  journal =      "Information Processing Letters",
  year =         "2005",
  volume =       "93",
  number =       "1",
  pages =        {13--17}
}

@inproceedings{961569,
  author =       "Lawrence D'Antonio",
  title =        "Incorporating bioinformatics in an algorithms
                  course",
  booktitle =    "ITiCSE '03: Proceedings of the 8th annual conference
                  on Innovation and technology in computer science
                  education",
  year =         "2003",
  isbn =         "1-58113-672-2",
  pages =        "211--214",
  location =     "Thessaloniki, Greece",
  doi =          "http://doi.acm.org/10.1145/961511.961569",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@inproceedings{320218,
  author =       "Udi Manber and Gene Myers",
  title =        "Suffix arrays: a new method for on-line string
                  searches",
  booktitle =    "SODA '90",
  year =         "1990",
  isbn =         "0-89871-251-3",
  pages =        "319--327",
  location =     "San Francisco, California, United States",
  publisher =    "Society for Industrial and Applied Mathematics",
  address =      "Philadelphia, PA, USA",
}

@article{1082039,
  author =       "Paolo Ferragina and Giovanni Manzini",
  title =        "Indexing compressed text",
  journal =      "J. ACM",
  volume =       "52",
  number =       "4",
  year =         "2005",
  issn =         "0004-5411",
  pages =        "552--581",
  doi =          "http://doi.acm.org/10.1145/1082036.1082039",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@Article{suffix-array-journal,
  author =       "Udi Manber and Gene Myers",
  title =        "Suffix arrays: a new method for on-line string
                  searches",
  journal =      "SIAM Journal on Computing",
  year =         1993,
  volume =       22,
  number =       5,
  pages =        {935--948}
}

@inproceedings{775061,
  author =       "Jon Kleinberg",
  title =        "Bursty and hierarchical structure in streams",
  booktitle =    "KDD '02",
  year =         "2002",
  isbn =         "1-58113-567-X",
  pages =        "91--101",
  location =     "Edmonton, Alberta, Canada",
  doi =          "http://doi.acm.org/10.1145/775047.775061",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@InProceedings{Syntex2005,
  author =       {D. Bourigault and C. Fabre and C. Fr{\'e}rot and
                  M.-P. Jacques and S. Ozdowska},
  title =        "Syntex, analyseur syntaxique de corpus",
  booktitle =    {Actes des 12{\`e}mes journ{\'e}es sur le
                  Traitement Automatique des Langues Naturelles},
  year =         "2005",
  ignoreurl =
                  {http://www.univ-tlse2.fr/erss/membres/bourigault/TALN05-bourigault-Syntex.pdf}
}

@Article{Syntex2000,
  author =       "D. Bourigault and C. Fabre",
  title =        "Approche linguistique pour l'analyse syntaxique de
                  corpus",
  journal =      "Cahiers de Grammaire",
  year =         "2000",
  number =       "25",
  pages =        {131--151}
}

@Misc{VeronisTagCloud,
  author =       {Jean V{\'e}ronis},
  title =        "Blogs: Banlieues dans les nuages",
  howpublished =
                  "\url{http://aixtal.blogspot.com/2005/11/blogs-banlieues-dans-les-nuages.html}",
  month =        nov,
  year =         2005
}

@Misc{TreeTagger,
  author =       "Achim Stein",
  title =        "TreeTagger -- a language independent part-of-speech
                  tagger",
  howpublished =
                  "\url{http://www.ims.uni-stuttgart.de/projekte/corplex/TreeTagger/DecisionTreeTagger.html}",
  month =        sep,
  year =         2005
}

@Misc{Wordnet,
  author =       "George A. Miller and Christiane Fellbaum and Randee
                  Tengi and Susanne Wolff and Pamela Wakefield and
                  Helen Langone and Benjamin Haskell",
  title =        "Wordnet -- a lexical database for the {English}
                  language",
  howpublished = "\url{http://wordnet.princeton.edu/}",
  note =         "checked 2006-10-17"
}

@inproceedings{lazysuffixtrees,
  author    = {R. Giegerich and S. Kurtz and J. Stoye},
  title     = {Efficient implementation of lazy suffix trees},
  booktitle = {WAE'99},
  year      = {1999},
  pages     = {30--42}
}

@article{375365,
  author =       "Gonzalo Navarro",
  title =        "A guided tour to approximate string matching",
  journal =      "ACM Comput. Surv.",
  volume =       "33",
  number =       "1",
  year =         "2001",
  issn =         "0360-0300",
  pages =        "31--88",
  doi =          "http://doi.acm.org/10.1145/375360.375365",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@Article{Myers1994,
  author =       "E. Myers",
  title =        "A sublinear algorithm for approximate keyword
                  searching",
  journal =      "Algorithmica",
  year =         "1994",
  volume =       "12",
  number =       "4/5",
  pages =        {345--374}
}

@inproceedings{738434,
  author =       "Erkki Sutinen and Jorma Tarhio",
  title =        "Filtration with q-Samples in Approximate String
                  Matching",
  booktitle =    "CPM '96: Proceedings of the 7th Annual Symposium on
                  Combinatorial Pattern Matching",
  year =         "1996",
  isbn =         "3-540-61258-0",
  pages =        "50--63",
  publisher =    "Springer-Verlag",
  address =      "London, UK",
}

@InProceedings{NavarroSutinen2000,
  author =       "G. Navarro and E. Sutinen and J. Tanninen and
                  J. Tarhio",
  title =        "Indexing text with approximate q-grams",
  booktitle =    "CPM'2000",
  pages =        "350--363",
  year =         2000
}

@article{958828,
  author =       {Stefan Burkhardt and Juha K{\"a}rkk{\"a}inen},
  title =        "Better filtering with gapped q-grams",
  journal =      "Fundam. Inf.",
  volume =       "56",
  number =       "1--2",
  year =         "2003",
  issn =         "0169-2968",
  pages =        "51--70",
  publisher =    "IOS Press",
  address =      "Amsterdam, The Netherlands",
}

@inproceedings{graycube,
  author =       "J. Gray and A. Bosworth and A. Layman and
                  H. Pirahesh",
  title =        "Data Cube: A Relational Aggregation Operator
                  Generalizing Group-By, Cross-Tab, and Sub-Total",
  booktitle =    "ICDE '96",
  year =         "1996",
  pages =        {152--159}
}

@TechReport{codd93,
  author =       "E. F. Codd",
  title =        "Providing {OLAP} (on-line analytical processing) to
                  user-analysts: an {IT} mandate",
  institution =  "E. F. Codd and Associates",
  year =         "1993",
}

@inproceedings{882090,
  author =       "B. Wang and F. Pan and D. Ren and Y. Cui and Q. Ding
                  and W. Perrizo",
  title =        "Efficient {OLAP} operations for spatial data using
                  {Peano} trees",
  booktitle =    "DMKD '03",
  year =         "2003",
  pages =        "28--34",
  location =     "San Diego, California",
  doi =          "http://doi.acm.org/10.1145/882082.882090",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@Article{moth:doccube,
  author =       {Josiane Mothe and Claude Chrisment and Bernard
                  Dousset and Joel Alaux},
  title =        {{DocCube}: Multi-Dimensional Visualization and
                  Exploration of Large Document Sets},
  journal =      jasist,
  year =         2003,
  volume =       54,
  number =       7,
  pages =        {650--659}
}

@inproceedings{345656,
  author =       "M. C. McCabe and J. Lee and A. Chowdhury and
                  D. Grossman and O. Frieder",
  title =        "On the design and evaluation of a multi-dimensional
                  approach to information retrieval",
  booktitle =    "SIGIR '00",
  year =         "2000",
  isbn =         "1-58113-226-3",
  pages =        "363--365",
  location =     "Athens, Greece",
  doi =          "http://doi.acm.org/10.1145/345508.345656",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@Book{Sullivan2001,
  publisher =    "John Wiley \& Sons",
  title =        "Document Warehousing and Text Mining: Techniques for
                  Improving Business Operations, Marketing, and Sales",
  author =       "D. Sullivan",
  year =         2001
}

@Article{niem:mddata-model-informetrics,
  author =       {Timo Niemi and Lasse Hirvonen and Kalervo
                  J{\"a}rvelin},
  title =        {Multidimensional Data Model and Query Language for
                  Informetrics},
  journal =      jasist,
  year =         2003,
  volume =       54,
  number =       10,
  pages =        {939--951}
}

@Article{bern:a-juste-titre,
  author =       "Michel Bernard",
  title =        "\textit{{\`A} juste titre}: A Lexicometric Approach
                  to the Study of Titles",
  journal =      llc,
  year =         1995,
  volume =       10,
  number =       2,
  pages =        {135--141}
}

@inproceedings{KeyKaserLemireAPICS2005,
  author =       "Steven Keith and Owen Kaser and Daniel Lemire",
  title =        "Analyzing Large Collections of Electronic Text Using
                  {OLAP}",
  booktitle =    "APICS 2005",
  year =         "2005",
  month =        oct,
  location =     "Wolfville, Canada",
  ignoreurl =
                  {http://www.daniel-lemire.com/fr/documents/publications/apics05-web.pdf}
}

@Article{KoAluru2003,
  author =       "Pang Ko and Srinivas Aluru",
  title =        "Space Efficient Linear Time Construction of Suffix
                  Arrays",
  journal =      "Lecture Notes in Computer Science",
  year =         2003,
  volume =       2676,
  pages =        {200--210}
}

@Article{ManziniFerragina,
  author =       "G. Manzini and P. Ferragina",
  title =        "Engineering a lightweight suffix array construction
                  algorithm",
  journal =      "Algorithmica",
  year =         2004,
  volume =       40,
  pages =        {33--50}
}

@inproceedings{fisher05,
  author =       "Johannes Fischer and Volker Heun and Stefan Kramer",
  title =        "Fast Frequent String Mining Using Suffix Arrays",
  booktitle =    "ICDM'05",
  year =         "2005",
  location =     "Houston, Texas",
  ignoreurl =    {http://cgi.bio.ifi.lmu.de/~fischer/fischer05fast.ps}
}

@Book{McHugh1989,
  Author =       "James A. M. McHugh",
  title =        "Algorithmic Graph Theory",
  publisher =    "Prentice-Hall",
  year =         "1989",
  ignoreurl =
                  {http://www.cs.njit.edu/mchugh/psswrd/web-course-materials/graph-theory/alg-graph-theory-text-pdf/}
}

@Book{thul:graphbook,
  AUTHOR =       "K. Thulasiraman and M. N. S. Swamy",
  TITLE =        "Graphs: Theory and Algorithms",
  PUBLISHER =    "John Wiley and Sons",
  YEAR =         1992,
  ADDRESS =      "New York"
}

@article{322150,
  author =       "Greg N. Frederickson",
  title =        "Approximation Algorithms for Some Postman Problems",
  journal =      "J. ACM",
  volume =       "26",
  number =       "3",
  year =         "1979",
  issn =         "0004-5411",
  pages =        "538--554",
  doi =          "http://doi.acm.org/10.1145/322139.322150",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@inproceedings{ChangPoon2006,
  author    = {M. Chang and C. K. Poon},
  title     = {Efficient Phrase Querying with Common Phrase Indexing},
  booktitle = {ECIR'06},
  year      = {2006}
}

@article{Zobel1998,
  author =       "J. Zobel and A. Moffat and K. Ramamohanarao",
  title =        "Inverted files versus signature files for text
                  indexing",
  journal =      "ACM Transactions on Database Systems",
  volume =       "23",
  number =       "4",
  pages =        "453--490",
  year =         1998
}

@inproceedings{Zobel2002,
  author    = {D. Bahle and H. E. Williams and J. Zobel},
  title     = {Efficient phrase querying with an auxiliary index},
  booktitle = {SIGIR'02},
  year      = {2002}
}

@inproceedings{1060785,
  author =       "Xiaohui Long and Torsten Suel",
  title =        "Three-level caching for efficient query processing
                  in large {Web} search engines",
  booktitle =    "WWW'05",
  year =         "2005",
  isbn =         "1-59593-046-9",
  pages =        "257--266",
  location =     "Chiba, Japan",
  doi =          "http://doi.acm.org/10.1145/1060745.1060785",
  publisher =    "ACM Press",
  address =      "New York, NY, USA",
}

@TechReport{viewsizetechreport,
  author =       "Daniel Lemire and Owen Kaser",
  title =        "One-Pass, One-Hash n-Gram Count Estimation",
  institution =  "Dept. of CSAS, UNBSJ",
  number =       "TR-06-001",
  year =         "2006",
  note =         {Available from
                  \url{http://arxiv.org/abs/cs.DB/0610010}}
}

@article{cai1995umd,
  title={Using multiset discrimination to solve language processing problems without hashing},
  author={Cai, J. and Paige, R.},
  journal={Theoretical Computer Science},
  volume={145},
  number={1--2},
  pages={189--228},
  year={1995},
  publisher={Elsevier}
}


@TechReport{0605103,
  author =       "Daniel Lemire",
  title =        "A Better Alternative to Piecewise Linear Time Series
                  Segmentation",
  institution =  "arxiv.org",
  number =       "cs.DB/0605103",
  year =         2006
}



@InCollection{275705,
 author = {M. F. Porter},
 title = {An Algorithm for Suffix Stripping},
 booktitle = {Readings in information retrieval},
 year = {1997},
 publisher = {Morgan Kaufmann},
 pages = {313--316}
 }


@comment{lemi:one-pass-conference,
  author =       "Daniel Lemire and Owen Kaser",
  title =        "One-Pass, One-Hash $n$-Gram Count Estimation",
  note =         "stripped down version is under review as lemi:one-pass-conference-stripped",
  year =         2006
}

@comment{lemi:one-pass-conference-stripped,
  author =       "Daniel Lemire and Owen Kaser",
  title =        "Recursive N-gram Hashing is Pairwise Independent, at Best",
  note =         "Under review", 
  comment =      "by Elsevier Computer Speech and Language",
  year =         2009
}

@Article{lemi:one-pass-journal,
  author =       "Daniel Lemire and Owen Kaser",
  title =        "Recursive N-gram Hashing is Pairwise Independent, at Best",
  journal =      "Computer Speech and Language",
  year =         2010,
  volume =       24,
  number =       4,
  pages =        "698--710",
  month =        oct,
  comment =      "publication announced April 2010"}

@Unpublished{pinarunpublished,
  author =       "G. Canahuate and H. Ferhatosmanoglu and A. Pinar",
  title =        "Improving bitmap index compression by data reorganization",
  note =         "\url{http://hpcrd.lbl.gov/~apinar/papers/TKDE06.pdf}~(checked 2008-12-15)",
  year =         2006
}

 @Misc{pinarunpublished---fr,
   author =       "G. Canahuate and H. Ferhatosmanoglu and A. Pinar",
   title =        "Improving bitmap index compression by data reorganization",
  howpublished = "En ligne~: \url{http://hpcrd.lbl.gov/~apinar/papers/TKDE06.pdf}",
  note =         "Dernier acc\`es le 12 f\'evrier 2008",
   year =         2006
 }

@misc{goog:all-our-ngram,
  author =       "Alex Franz and Thorsten Brants",
  title =        "All Our N-Gram are Belong to You",
  howpublished = "in the Google Research Blog,
                  \url{http://googleresearch.blogspot.com/2006/08/all-our-n-gram-are-belong-to-you.html}",
  month =        aug,
  year =         2006,
  note =         {checked 2006-08-09}
}

@Misc{tapo:betatools,
  author =       "{TAPoR Project}",
  title =        "{TAPoR} Prototype of Text Analysis Tools",
  howpublished = "online:
                  \url{http://taporware.mcmaster.ca/~taporware/betaTools/index.shtml}",
  year =         2005,
  note =         {checked 2006-06-27}
}

@MastersThesis{keit:mcs-unb,
  author =       "Steven W. Keith",
  title =        "Efficient Storage Methods for a Literary Data
                  Warehouse",
  school =       "UNB",
  year =         2006
}

@Misc{mondrian,
  author =       "Julian Hyde",
  title =        "Mondrian",
  howpublished = "online: \url{http://mondrian.sourceforge.net}",
  note =         {checked 2006-06-27}
}

@Misc{mondrian-pentaho,
  author =    {Pentaho},
  title =     {Pentaho Analysis Service: Mondrian Project},
  howpublished = {online: \url{http://mondrian.pentaho.org}},
  note =      {checked 2009-09-19}}

@Misc{oreilly-warstories,
  author =       "Dare Obasanjo",
  title =        "{O'Reilly} Database War Stories Highlights",
  howpublished = "online,
                  \url{http://www.25hoursaday.com/weblog/PermaLink.aspx?guid=cbdad3fb-ddce-4f72-bc75-f0cace39a1ae}",
  month =        jun,
  year =         2006,
  note =         {checked 2006-06-27}
}

@Article{TurneyML,
  author =       "P. D. Turney and M. L. Littman",
  title =        "Corpus-Based Learning of Analogies and Semantic
                  Relations",
  journal =      "Machine Learning",
  year =         2005,
  volume =       60,
  number =       "1--3",
  pages =        {251--278}
}

@Article{StubbsConrad2005,
  author =       "Michael Stubbs",
  title =        "Conrad in the computer: examples of quantitative
                  stylistic methods",
  journal =      "Language and Literature",
  year =         "2005",
  volume =       "14",
  number =       "1",
  pages =        {5--24}
}

@Book{Leed1966,
  editor =       "J. Leed",
  title =        "The Computer and Literary Style",
  publisher =    "Kent State University Press",
  year =         "1966",
  address =      {Kent, Ohio, USA}
}

@InProceedings{unsworth2004,
  author =       "John Unsworth",
  title =        "Forms of Attention: Digital Humanities Beyond
                  Representation",
  booktitle =    "CaSTA 2004",
  city =         "Hamilton",
  province =     "Ontario",
  country =      "Canada",
  month =        nov,
  year =         "2004",
  organization = "McMaster University",
  url =          {http://www3.isrl.uiuc.edu/~unsworth/FOA/}
}

@InProceedings{ramsay2005,
  author =       "Stephen Ramsay",
  title =        "Mining {Shakespeare}",
  booktitle =    "ACH/ALLC 2005",
  city =         "Victoria",
  province =     "British Columbia",
  country =      "Canada",
  month =        jun,
  year =         "2005",
  organization = "University of Victoria",
  url =
                  {http://mustard.tapor.uvic.ca:8080/cocoon/ach_abstracts/proof/session_208_ruecker.pdf}
}

@article{craig1999,
  author  = {Craig, Hugh},
  title   = {Authorial Attribution and Computational Stylistics: if you can tell authors apart, have you learned anything about them?},
  journal = llc,
  volume  = 14,
  year    = {1999}
}

@inproceedings{992763,
  author    = {Stamatatos, E. and Fakotakis, N. and Kokkinakis, G.},
  title     = {Text genre detection using common word frequencies},
  booktitle = {Proceedings of the 17th conference on Computational linguistics},
  pages     = {808--814},
  year      = {2000},
  isbn      = {1-555-55555-1},
  location  = {Saarbr{\"u}cken, Germany},
  publisher = {Association for Computational Linguistics},
  address   = {Morristown, NJ, USA}
}

@inproceedings{977055,
  author    = {Wolters, Maria and Kirsten, Mathias},
  title     = {Exploring the use of linguistic features in domain and genre classification},
  booktitle = {Proceedings of the ninth conference on European chapter of the Association for Computational Linguistics},
  pages     = {142--149},
  year      = {1999},
  location  = {Bergen, Norway},
  publisher = {Association for Computational Linguistics},
  address   = {Morristown, NJ, USA}
}

@book{Foster2001,
  author    = {Foster, D.},
  title     = {Author unknown -- on the trail of Anonymous},
  publisher = {Macmillan},
  address   = {London},
  year      = {2001}
}

@comment{datacube,
 author="Jim  Gray and Surajit  Chaudhuri and Adam  Bosworth and Andrew  Layman and Don  Reichart and Murali  Venkatrao and Frank  Pellow and Hamid  Pirahesh",
 title= "Data Cube: A Relational Aggregation Operator Generalizing Group-By, Cross-Tab, and Sub-Totals",
 journal="Data Mining and Knowledge Discovery",
 volume="1",
 number="1",
 pages="29--53",
 year="1997",
 month="March"
}
@article{autoatt1,
  author  = {J. Diederich and J. Kindermann and E. Leopold and Gerhard Paass},
  title   = {Authorship Attribution with Support Vector Machines},
  journal = {Applied Intelligence},
  volume  = {19},
  number  = {1--2},
  pages   = {109--123},
  month   = jul,
  year    = {2003}
}

@article{autoatt2,
  author  = {E. Stamatatos and N. Fakotakis and G. Kokkinakis},
  title   = {Computer-Based Authorship Attribution Without Lexical Measures},
  journal = {Computers and the Humanities},
  volume  = {35},
  number  = {2},
  pages   = {193--214},
  month   = may,
  year    = {2001}
}

@inproceedings{autoatt3,
  author    = {H. Baayen and H. van Halteren and A. Neijt and F. Tweedie},
  title     = {An experiment in authorship attribution},
  booktitle = {Journ{\'e}es Internationales d'Analyse Statistique des Donn{\'e}es Textuelles},
  year      = {2002}
}

@article{vocabmeasure,
  author  = {F. J. Tweedie and R. H. Baayen},
  title   = {How Variable May a Constant be? Measures of Lexical Richness in Perspective},
  journal = {Computers and the Humanities},
  volume  = {32},
  number  = {5},
  pages   = {323--352},
  year    = {1998}
}

@comment{month="September",}
@book{foster1,
  author    = {Foster, D.},
  title     = {Author Unknown: on the trail of Anonymous},
  publisher = {Henry Holt and Company, LLC},
  address   = {New York, New York, USA},
  year      = 2000
}

@book{foster2,
  author    = {Foster, D.},
  title     = {Elegy by W. S.},
  publisher = {Associated University Presses},
  address   = {Mississauga, Ontario, Canada},
  year      = 1989
}

@inproceedings{882090,
  author    = {B. Wang and F. Pan and D. Ren and Y. Cui and Q. Ding and W. Perrizo},
  title     = {Efficient {OLAP} operations for spatial data using {Peano} trees},
  booktitle = {DMKD '03},
  pages     = {28--34},
  year      = {2003},
  location  = {San Diego, California},
  doi       = {10.1145/882082.882090},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@article{Mendenhall,
  author  = {Mendenhall, T.},
  title   = {The Characteristic Curves of Composition},
  journal = {Science},
  volume  = {IX},
  pages   = {237--249},
  year    = {1887}
}

@techreport{Turney-Littman-report,
  author      = {Turney, P. D. and Littman, M. L.},
  title       = {Learning Analogies and Semantic Relations},
  institution = {National Research Council, Institute for Information Technology},
  number      = {ERB-1103},
  year        = {2003}
}

@book{SQLServerMDX2005,
  author    = {Harinath, S. and Quinn, S. R.},
  title     = {Professional {SQL} Server Analysis Services 2005 with MDX},
  publisher = {Wrox},
  year      = 2005
}

@misc{MDX,
  author       = {Microsoft},
  title        = {{MDX}},
  howpublished = {online: \url{http://www.microsoft.com/sqlserver/2008/en/us/wp-sql-2008-analysis-services.aspx}},
  note         = {Analysis Services Overview, (Last checked 07-29-2009)},
  year         = {2008}
}

@misc{SatorBase,
  author       = {{Soci\'{e}t\'{e} d'analyse de la topique romanesque}},
  title        = {{SatorBase}},
  howpublished = {\url{http://www.satorbase.org/}},
  note         = {checked 2006-10-17},
  year         = 2005
}

@misc{Blogpulse,
  author       = {Intelliseek},
  title        = {Blogpulse},
  howpublished = {\url{http://www.blogpulse.com/}},
  year         = 2005
}

@article{stylometry,
  author  = {Can, F. and Patton, J.},
  title   = {Change of Writing Style with Time},
  journal = {Computers and the Humanities},
  volume  = {38},
  number  = {1},
  pages   = {61--82},
  month   = feb,
  year    = {2004}
}

@article{767151,
  author    = {Halevy, Alon Y.},
  title     = {Answering queries using views: A survey},
  journal   = {The VLDB Journal},
  volume    = {10},
  number    = {4},
  pages     = {270--294},
  year      = {2001},
  issn      = {1066-8888},
  doi       = {10.1007/s007780100054},
  publisher = {Springer-Verlag New York, Inc.},
  address   = {Secaucus, NJ, USA}
}

@article{641272,
  author    = {Chirkova, Rada and Halevy, Alon Y. and Suciu, Dan},
  title     = {A formal perspective on the view selection problem},
  journal   = {The VLDB Journal},
  volume    = {11},
  number    = {3},
  pages     = {216--237},
  year      = {2002},
  issn      = {1066-8888},
  doi       = {10.1007/s00778-002-0070-0},
  publisher = {Springer-Verlag New York, Inc.},
  address   = {Secaucus, NJ, USA}
}

@article{chak:graph-mining-surveys,
  author  = {Chakrabarti, D. and Faloutsos, C.},
  title   = {Graph Mining: Laws, Generators, and Algorithms},
  journal = csur,
  volume  = 38,
  pages   = {1--69},
  year    = 2006,
  note    = {Article 2}
}

@misc{liu:montylingua,
  author       = {Liu, Hugo},
  title        = {{MontyLingua}: An end-to-end natural language processor with common sense},
  howpublished = {online. \url{http://web.media.mit.edu/~hugo/montylingua}},
  note         = {checked 2006-10-25},
  year         = 2004
}

@inproceedings{lloy:newspapers-vs-blogs,
  author       = {Lloyd, Levon and Kaulgud, Prachi and Skiena, Steven},
  title        = {Newspapers vs Blogs: Who Gets the Scoop},
  booktitle    = {Computational Approaches to Analyzing Weblogs (AAAI-CAAW)},
  organization = {AAAI},
  month        = mar,
  year         = 2006,
  note         = {online: \url{http://www.algorithm.cs.sunysb.edu/lloyd/mypapers/blog_paper.pdf}, checked 2006-11-22},
  anothernote  = {skiena says to cite his IEEE TVCG paper for heat maps}
}

@article{mehl:spatial-analysis-news,
  author  = {Mehler, Andrew and Bao, Yunfan and Li, Xin and Wang, Yue and Skiena, Steven},
  title   = {Spatial Analysis of News Sources},
  journal = {IEEE Trans. Visualization and Computer Graphics},
  volume  = 12,
  pages   = {765--772},
  year    = 2006
}

@inproceedings{hass:improving-tag-clouds,
  author    = {{Hassan-Montero}, Yussef and {Herrero-Solana}, Victor},
  title     = {Improving Tag-Clouds as Visual Information Retrieval Interfaces},
  booktitle = {InSciT'06},
  year      = {2006}
}

@article{kenn:force-directed,
  author  = {Kennings, Andrew and Vorwerk, Kristofer P.},
  title   = {Force-Directed Methods for Generic Placement},
  journal = tcad,
  volume  = 25,
  number  = 10,
  pages   = {2076--2087},
  year    = 2006
}

@inproceedings{shi:optimal-slicing,
  author        = {Shi, Weiping},
  title         = {An Optimal Algorithm for Area Minimization of Slicing Floorplans},
  booktitle     = {ACM/IEEE International Conference on Computer-Aided Design (ICCAD)},
  pages         = {480--484},
  year          = {1995},
  doi           = {10.1109/ICCAD.1995.480160},
  Omitisbn      = {0-8186-7213-7},
  Omitpublisher = {IEEE Computer Society},
  Omitaddress   = {Los Alamitos, CA, USA}
}

@inproceedings{mura:rectangle-packing-placement,
  author    = {Murata, H. and Fujiyoshi, K. and Nakatake, S. and Kajitani, Y.},
  title     = {Rectangle-Packing-Based Module Placement},
  booktitle = {ACM/IEEE International Conference on Computer-Aided Design (ICCAD)},
  pages     = {472--479},
  year      = {1995},
  isbn      = {0-8186-7213-7},
  doi       = {10.1109/ICCAD.1995.480159},
  publisher = {IEEE Computer Society},
  address   = {Los Alamitos, CA, USA}
}

@inproceedings{otte:floorplan-dac82,
  author    = {Otten, Ralph H. J. M.},
  title     = {Automatic Floorplan Design},
  booktitle = {19th Design Automation Conference},
  pages     = {261--267},
  year      = 1982,
  note      = {also subject of US patent 4554625}
}

@article{stoc:orientation-floorplan,
  author  = {Stockmeyer, Larry},
  title   = {Optimal Orientation of Cells in Slicing Floorplan Designs},
  journal = {Information and Control},
  volume  = 57,
  number  = {2--3},
  year    = 1983
}

@article{cong:lookahead-bipartitioning,
  author  = {Cong, Jason and Romesis, Michail and Shinnerl, Joseph R.},
  title   = {Fast Floorplanning by Look-Ahead Enabled Recursive Bipartitioning},
  journal = tcad,
  volume  = 25,
  number  = 9,
  pages   = {1719--1732},
  year    = 2006
}

@article{knut:breaking-paragraphs,
  author  = {Knuth, Donald E. and Plass, Michael F.},
  title   = {Breaking Paragraphs into Lines},
  journal = {Software --- Practice and Experience},
  volume  = 11,
  number  = 11,
  pages   = {1119--1184},
  year    = 1981
}

@book{knut:tex,
  author    = {Knuth, Donald E.},
  title     = {The {\TeX}book},
  publisher = {Addison-Wesley},
  year      = 1984
}

@book{gare:gandj,
  author    = {Garey, Michael R. and Johnson, David S.},
  title     = {Computers and Intractability: A Guide to the Theory of {NP}-Completeness},
  publisher = {W. H. Freeman},
  address   = {New York},
  year      = 1979
}

@misc{cres:online-compendium,
  author       = {Crescenzi, Pierluigi and Kann, Viggo},
  title        = {A Compendium of {NP} Optimization Problems},
  howpublished = {online at \url{http://www.nada.kth.se/~viggo/wwwcompendium/}},
  note         = {accessed 27 Nov 2006}
}

@inproceedings{Korn:2000:ISB:342009.335415,
  author    = {Korn, Flip and Muthukrishnan, S.},
  title     = {Influence sets based on reverse nearest neighbor queries},
  booktitle = {Proceedings of the 2000 ACM SIGMOD international conference on Management of data},
  series    = {SIGMOD '00},
  year      = {2000},
  isbn      = {1-58113-217-4},
  location  = {Dallas, Texas, United States},
  pages     = {201--212},
  numpages  = {12},
  url       = {http://doi.acm.org/10.1145/342009.335415},
  doi       = {10.1145/342009.335415},
  acmid     = {335415},
  publisher = {ACM},
  address   = {New York, NY, USA}
}

@inproceedings{schi:rect-packing-esa,
  author    = {Schiermeyer, Ingo},
  title     = {Reverse Fit: A 2-Optimal Algorithm for Packing Rectangles},
  booktitle = {Proceedings, 2nd Ann. European Symposium on Algorithms (ESA)},
  series    = {Lecture Notes in Computer Science},
  volume    = 855,
  pages     = {290--299},
  publisher = {Springer-Verlag},
  year      = 1994
}

@inproceedings{keny:strip-packing-focs,
  author    = {Kenyon, Claire and R{\'e}mila, Eric},
  title     = {Approximate Strip Packing},
  booktitle = {Proceedings, 37th Annual IEEE Symposium on the Foundations of Computer Science},
  pages     = {31--36},
  publisher = {IEEE Computer Society},
  year      = 1996
}

@article{DBLP:journals/mor/KenyonR00,
  author    = {Kenyon, Claire and R{\'e}mila, Eric},
  title     = {A Near-Optimal Solution to a Two-Dimensional Cutting Stock Problem},
  journal   = {Math. Oper. Res.},
  volume    = 25,
  number    = 4,
  pages     = {645--656},
  year      = 2000,
  doi       = {10.1287/moor.25.4.645.12118},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{lodi2002tdp,
  author    = {Lodi, A. and Martello, S. and Monaci, M.},
  title     = {Two-dimensional packing problems: A survey},
  journal   = {European Journal of Operational Research},
  volume    = {141},
  number    = {2},
  pages     = {241--252},
  publisher = {Elsevier Science},
  year      = {2002}
}

@article{coff:level-oriented,
  author  = {Edward G. {Coffman, Jr.} and Garey, Michael R. and Johnson, David S. and Tarjan, Robert E.},
  title   = {Performance Bounds for Level-Oriented Two-Dimensional Packing Algorithms},
  journal = {SIAM J. Comput.},
  volume  = 9,
  number  = 4,
  pages   = {808--826},
  year    = 1980
}

@misc{valenzuela-heuristics,
  author = {Valenzuela, Christine L. and Wang, Pearl Y.},
  title  = {Heuristics for Large Strip Packing Problems with Guillotine Patterns: an Empirical Study},
  note   = {\url{citeseer.ist.psu.edu/valenzuela01heuristics.html}. checked 2006-11-28},
  year   = 2001
}

@inproceedings{zhan:fixed-die,
  author    = {Zhan, Yong and Feng, Yan and Sapatnekar, Sachin S.},
  title     = {A Fixed-die Floorplanning Algorithm Using an Analytical Approach},
  booktitle = {Proceedings, Asia-South Pacific Design Automation Conference},
  pages     = {771--776},
  year      = 2006
}

@inproceedings{dubi:tags-over-time,
  author    = {Dubinko, Micah and Kumar, Ravi and Magnani, Joseph and Novak, Jasmine and Raghavan, Prabhakar and Tomkins, Andrew},
  title     = {Visualizing Tags over Time},
  booktitle = {15th International World Wide Web Conference},
  pages     = {193--202},
  publisher = {ACM Press},
  address   = {New York, NY, USA},
  year      = 2006
}

@misc{shaw:semidefinite-folksonomies-proposal,
  author       = {Shaw, Blake},
  title        = {Semidefinite Embedding Applied to Visualizing Folksonomies},
  howpublished = {CS6772 Project Proposal, Columbia University},
  month        = dec,
  year         = 2005,
  note         = {online: \url{http://www.metablake.com/advml/adv-ml-project.pdf}, checked 30 November 2006}
}

@misc{CategoryTagging,
  author = {Woehrer, Michael},
  title  = {{Category Tagging} --- A {WordPress} Plugin},
  year   = {2006},
  url    = {http://sw-guide.de/wordpress/category-tagging-plugin/},
  note   = {[Online; accessed 17-January-2007]}
}

@book{coupland1996m,
  author    = {Coupland, D.},
  title     = {Microserfs},
  publisher = {Flamingo},
  year      = {1996}
}

@misc{wiki:tag-cloud,
  author = {Wikipedia},
  title  = {Tag Cloud --- {W}ikipedia{,} The Free Encyclopedia},
  year   = {2004},
  url    = {http://en.wikipedia.org/w/index.php?title=Tag_cloud&oldid=98381481},
  note   = {[Online; accessed 4-January-2007]}
}



@misc{wiki:bitmapindex,
  author = {Wikipedia},
  title  = {Bitmap Index --- {W}ikipedia{,} The Free Encyclopedia},
  year   = {2008},
  url    = {http://en.wikipedia.org/w/index.php?title=Bitmap_index&oldid=213738023},
  note   = {[Online; accessed 26-May-2008]}
}

@misc{wikipedia,
  author = {{Wikimedia Foundation, Inc.}},
  title  = {Wikipedia, the free encyclopedia},
  year   = {2001},
  url    = {http://en.wikipedia.org/},
  note   = {[Online; accessed 8-May-2007]}
}

@misc{wiki:birthday-paradox,
  author = {Wikipedia},
  title  = {Birthday Paradox --- {W}ikipedia{,} The Free Encyclopedia},
  year   = {2007},
  url    = {http://en.wikipedia.org/w/index.php?title=Birthday_Paradox},
  note   = {[Online; accessed 18-01-2007]}
}

@misc{zoomclouds,
  author = {{AR Networks}},
  title  = {{ZoomClouds}},
  year   = {2007},
  url    = {http://www.zoomclouds.com/},
  note   = {[Online; accessed 22-01-2007]}
}

@misc{flickr,
  author = {{Yahoo! Inc.}},
  title  = {Flickr},
  year   = {2007},
  url    = {http://www.flickr.com/},
  note   = {[Online; accessed 22-01-2007]}
}

@misc{swivel,
  author       = {{Swivel, Inc}},
  title        = {Swivel},
  howpublished = {\url{http://www.swivel.com}},
  note         = {[Online; accessed 7-6-2007]},
  year         = 2007
}

@misc{cistidrillclouds,
  author = {Newton, Glen},
  title  = {Drill Clouds},
  year   = {2007},
  url    = {http://lab.cisti.nrc.gc.ca/cistilabswiki/index.php/Drill_Clouds},
  note   = {[Online; accessed 4-10-2007]}
}



@article{butler2007dsn,
  author  = {Butler, D.},
  title   = {Data sharing: the next generation},
  journal = {Nature},
  volume  = {446},
  number  = {7131},
  pages   = {1--10},
  year    = 2007
}

@misc{manyeyes,
  author       = {{IBM}},
  title        = {{Many Eyes}},
  howpublished = {\url{http://services.alphaworks.ibm.com/manyeyes/}},
  note         = {[Online; accessed 7-6-2007]},
  year         = {2007}
}

@misc{del.icio.us,
  author = {{Yahoo! Inc.}},
  title  = {del.icio.us},
  year   = {2007},
  url    = {http://del.icio.us/},
  note   = {[Online; accessed 22-01-2007]}
}

@misc{technorati,
  author = {{Technorati Inc.}},
  title  = {Technorati},
  year   = {2007},
  url    = {http://technorati.com/},
  note   = {[Online; accessed 22-01-2007]}
}

@misc{amazontagclouds,
  author = {{Amazon.com}},
  title  = {Amazon Tag Clouds},
  year   = {2007},
  url    = {http://www.amazon.com/gp/tagging/cloud},
  note   = {[Online; accessed 15-05-2007]}
}

@misc{oreillytagclouds,
  author = {{O'Reilly Media}},
  title  = {Content Statistics},
  year   = {2007},
  url    = {http://labs.oreilly.com/stats/},
  note   = {[Online; accessed 15-05-2007]}
}

@misc{FASMI,
  author       = {Pendse, N.},
  title        = {What Is {OLAP}?},
  howpublished = {\url{http://www.olapreport.com/fasmi.htm}},
  institution  = {The {OLAP} Report},
  note         = {[Online; accessed 22-01-2007]},
  year         = 1995
}

@article{corm:whats-hot,
  author    = {Cormode, G. and Muthukrishnan, S.},
  title     = {What's Hot and What's Not: Tracking Most Frequent Items Dynamically},
  journal   = {ACM Trans. Database Syst.},
  volume    = {30},
  number    = {1},
  pages     = {249--278},
  year      = {2005},
  issn      = {0362-5915},
  doi       = {10.1145/1061318.1061325},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{dema:freq-est-esa02,
  author    = {Demaine, Erik D. and L{\'o}pez-Ortiz, Alejandro and Munro, J. Ian},
  title     = {Frequency Estimation of Internet Packet Streams with Limited Space},
  booktitle = {Proceedings of ESA-2002, LNCS 2461},
  pages     = {348--360},
  publisher = {Springer-Verlag},
  year      = 2002
}

@inproceedings{iked:text-from-templates,
  author    = {Ikeda, Daisuke and Yamada, Yasuhiro},
  title     = {Gathering Text Files Generated from Templates},
  booktitle = {IIWeb Workshop, VLDB-2004},
  year      = 2004
}

@misc{weas:weasel-reader-home,
  author       = {Grunenfelder, John},
  title        = {Weasel Reader: Free Reading},
  howpublished = {online: \url{http://gutenpalm.sourceforge.net/}},
  note         = {last checked 18-01-2007},
  year         = 2006
}

@misc{atki:newgut-software,
  author       = {Atkins, Tyler},
  title        = {Newgut program},
  howpublished = {online: \url{http://rumkin.com/reference/gutenberg/newgut}},
  note         = {last checked 18-01-2007},
  year         = 2004
}

@article{flaj:approx-counting,
  author  = {Flajolet, Philippe},
  title   = {Approximate Counting: A Detailed Analysis},
  journal = {BIT},
  volume  = 25,
  pages   = {113--134},
  year    = 1985
}

@article{morr:approx-counting,
  author    = {Morris, Robert},
  title     = {Counting large numbers of events in small registers},
  journal   = {Commun. ACM},
  volume    = 21,
  number    = 10,
  pages     = {840--842},
  year      = 1978,
  issn      = {0001-0782},
  doi       = {10.1145/359619.359627},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@article{DBLP:journals/scp/MisraG82,
  author    = {Misra, Jayadev and Gries, David},
  title     = {Finding Repeated Elements},
  journal   = {Sci. Comput. Program.},
  volume    = 2,
  number    = 2,
  pages     = {143--152},
  year      = 1982,
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{karp:repeats03,
  author    = {Karp, Richard M. and Shenker, Scott and Papadimitriou, Christos H.},
  title     = {A simple algorithm for finding frequent elements in streams and bags},
  journal   = {ACM Trans. Database Syst.},
  volume    = {28},
  number    = {1},
  pages     = {51--55},
  year      = {2003},
  issn      = {0362-5915},
  doi       = {10.1145/762471.762473},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@book{skie:algs-design-manual,
  author    = {Skiena, Steven S.},
  title     = {The Algorithm Design Manual},
  publisher = {Springer-Verlag},
  year      = 1998
}

@book{dibattista1999gda,
  author    = {Di Battista, G. and others},
  title     = {Graph drawing: algorithms for the visualization of graphs},
  publisher = {Prentice Hall},
  year      = {1999}
}

@article{purchase2000eiv,
  author    = {Purchase, H. C.},
  title     = {Effective information visualisation: a study of graph drawing aesthetics and algorithms},
  journal   = {Interacting with Computers},
  volume    = {13},
  number    = {2},
  pages     = {147--162},
  publisher = {Elsevier},
  year      = {2000}
}

@mastersthesis{Bielenberg2005,
  author = {Bielenberg, Kai and Zacher, Marc},
  title  = {Groups in Social Software: Utilizing Tagging to Integrate Individual Contexts for Social Navigation},
  school = {Universit{\"a}t Bremen},
  year   = 2005
}

@inproceedings{hurs:tighter-tables,
  author    = {Hurst, Nathan and Marriott, Kim and Moulder, Peter},
  title     = {Toward Tighter Tables},
  booktitle = {Proceedings, DocEng'05},
  year      = 2005
}

@inproceedings{hurst:continuous,
  author    = {Hurst, Nathan and Marriott, Kim and Albrecht, David},
  title     = {Solving the simple continuous table layout problem},
  booktitle = {Proceedings, DocEng '06},
  pages     = {28--30},
  year      = {2006}
}

@misc{css3-text,
  author       = {E. J. {Etemad (Editor)}},
  title        = {{CSS3} Text Effects Module},
  howpublished = {\url{http://www.w3.org/TR/css3-text/}, last checked on 24/01/2007},
  institution  = {W3C},
  note         = {W3C Working Draft 27 June 2005},
  year         = 2005
}


@misc{css3-fonts,
  author       = {Michel Suignard and Chris {Lilley (editors)}},
  title        = {{CSS3} Module: Fonts},
  howpublished = {\url{http://www.w3.org/TR/css3-fonts/}, last checked on 28/01/2007},
  institution  = {W3C},
  note         = {W3C Working Draft 2 August 2002},
  year         = 2002
}

@misc{sneep2005,
  author       = {Sneep, M.},
  title        = {A short comparison of various typesetting engines},
  howpublished = {\url{http://www.nat.vu.nl/~sneep/ars/type/comparison.pdf}, last checked on 24/01/2007},
  year         = 2005
}

@inproceedings{1141859,
  author    = {Russell, T.},
  title     = {cloudalicious: folksonomy over time},
  booktitle = {JCDL'06},
  pages     = {364--364},
  isbn      = {1-59593-354-9},
  year      = {2006}
}

@inproceedings{1124792,
  author    = {Millen, D. R. and Feinberg, J. and Kerr, B.},
  title     = {Dogear: Social bookmarking in the enterprise},
  booktitle = {CHI '06},
  pages     = {111--120},
  year      = {2006}
}

@inproceedings{1149949,
  author    = {Marlow, C. and Naaman, M. and Boyd, D. and Davis, M.},
  title     = {{HT06}, tagging paper, taxonomy, {Flickr}, academic article, to read},
  booktitle = {HYPERTEXT'06},
  pages     = {31--40},
  year      = {2006},
  isbn      = {1-59593-417-0},
  location  = {Odense, Denmark},
  doi       = {10.1145/1149941.1149949},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{1178692,
  author    = {Jaffe, A. and Naaman, M. and Tassa, T. and Davis, M.},
  title     = {Generating summaries and visualization for large collections of geo-referenced photographs},
  booktitle = {MIR '06},
  pages     = {89--98},
  year      = {2006}
}

@article{1105676,
  author  = {Millen, D. and Feinberg, J. and Kerr, B.},
  title   = {Social bookmarking in the enterprise},
  journal = {Queue},
  volume  = {3},
  number  = {9},
  pages   = {28--35},
  issn    = {1542-7730},
  year    = {2005}
}

@incollection{zimm:topdown,
  author    = {Zimmermann, Gerhard},
  title     = {Top--Down Design of Digital Systems},
  booktitle = {Advances in CAD for VLSI, Volume 2: Logic Design and Simulation},
  editor    = {Horbst, E.},
  publisher = {North--Holland},
  pages     = {9--30},
  year      = 1986
}

@inproceedings{zimm:estimation,
  author    = {Zimmermann, Gerhard},
  title     = {A New Area and Shape Function Estimation Technique for {VLSI} Layouts},
  booktitle = dac88,
  pages     = {60--65},
  year      = 1988
}

@inproceedings{leng:robust,
  author    = {Lengauer, Thomas and Muller, Rolf},
  title     = {A Robust Framework for Hierarchical Floorplanning with Integrated Global Wiring},
  booktitle = iccad90,
  pages     = {148--151},
  year      = 1990,
  omitnote  = {Also report 70, Dept. of Math. and CS, U. Paderborn}
}

@techreport{leng:floorplanning-complexity,
  author      = {Lengauer, Thomas and Muller, Rolf},
  title       = {The Complexity of Floorplanning Based on Binary Circuit Partitions},
  institution = {Fachbereich Mathematik--Informatik, U. Paderborn, Germany},
  number      = 46,
  year        = 1987
}

@inproceedings{mcfa:evaluation,
  author    = {Michael C. {McFarland, SJ}},
  title     = {A Fast Floor Planning Algorithm for Architectural Evaluation},
  booktitle = iccd89,
  pages     = {96--99},
  year      = 1989
}

@book{leng:combinatorial,
  author    = {Lengauer, Thomas},
  title     = {Combinatorial Algorithms for Integrated Circuit Layout},
  publisher = {John Wiley and Sons},
  address   = {New York},
  year      = 1990
}

@inproceedings{fidu:FM,
  author    = {Fiduccia, C. M. and Mattheyses, R. M.},
  title     = {A Linear-Time Heuristic for Improving Network Partitions},
  booktitle = dac82,
  year      = 1982
}

@article{kirk:simulated-annealing-science,
  author  = {S. Kirkpatrick and C. D. {Gelatt, Jr} and M. P. Vecchi},
  title   = {Optimization by Simulated Annealing},
  journal = {Science},
  volume  = 220,
  pages   = {671--680},
  year    = 1983
}

@article{brue:mincut-placement,
  author  = {Breuer, Melvin A.},
  title   = {Min-cut Placement},
  journal = {Journal of Design Automation and Fault-Tolerant Computing},
  volume  = 1,
  number  = 4,
  pages   = {343--362},
  year    = 1977
}

@article{DBLP:journals/tcad/RoyAPM06,
  author    = {Roy, Jarrod A. and Adya, Saurabh N. and Papa, David A. and Markov, Igor L.},
  title     = {Min-cut floorplacement},
  journal   = {IEEE Trans. on CAD of Integrated Circuits and Systems},
  volume    = {25},
  number    = {7},
  pages     = {1313--1326},
  year      = {2006},
  doi       = {10.1109/TCAD.2005.855969},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@book{holl:genetic-algorithms,
  author    = {Holland, John H.},
  title     = {Adaptation in Natural and Artificial Systems},
  publisher = {University of Michigan Press},
  year      = 1975
}

@book{bulw:caxtons,
  author    = {{Bulwer-Lytton}, Edward},
  title     = {The Caxtons},
  publisher = {Project Gutenberg},
  year      = 1849,
  note      = { e-book number 7605, file b033w10.txt}
}

@book{rode:anglo-russian,
  author    = {Rodenbough, Theophilus F.},
  title     = {Afghanistan and the Anglo-Russian Dispute},
  publisher = {Project Gutenberg; originally G. P. Putnam's Sons},
  year      = 1885,
  note      = {e-book number 7320, file aaard10.txt}
}

@article{DBLP:journals/spe/AtkinsonG06,
  author    = {Atkinson, Darren C. and Griswold, William G.},
  title     = {Effective pattern matching of source code using abstract syntax patterns},
  journal   = {Softw., Pract. Exper.},
  volume    = {36},
  number    = {4},
  pages     = {413--447},
  year      = {2006},
  doi       = {10.1002/spe.704},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{chan:blobb-and-compass,
  author    = {Chan, Hayward and Markov, Igor L.},
  title     = {Practical Slicing and Non-slicing Block Packing without Simulated Annealing},
  booktitle = {Proceedings, Great Lakes Symposium on VLSI},
  pages     = {282--287},
  year      = 2004,
  note      = {see also \url{http://vlsicad.eecs.umich.edu/BK/BLoBB/}}
}

@article{fruc:force-graph-drawing,
  author  = {Thomas M. J. Fruchterman and Edward M. Reingold},
  title   = {Graph Drawing by Force-directed Placement},
  journal = {Software --- Practice and Experience},
  volume  = {21},
  number  = {11},
  pages   = {1129--1164},
  year    = {1991}
}

% Venue spelling corrected: the series is "Congressus Numerantium".
@inproceedings{eade:force,
  author    = {P. Eades},
  title     = {A Heuristic for Graph Drawing},
  booktitle = {Congressus Numerantium},
  pages     = {149--160},
  year      = {1984}
}

@article{dunl:placement,
  author  = {Alfred E. Dunlop and Brian W. Kernighan},
  title   = {A Procedure for Placement of Standard-Cell {VLSI}
             Circuits},
  journal = tcad,
  volume  = {4},
  pages   = {92--98},
  month   = jan,
  year    = {1985}
}

@inproceedings{1193309,
  author    = {Daria Sorokina and Johannes Gehrke and Simeon Warner
               and Paul Ginsparg},
  title     = {Plagiarism Detection in {arXiv}},
  booktitle = {ICDM '06: Proceedings of the Sixth International
               Conference on Data Mining},
  pages     = {1070--1075},
  year      = {2006},
  isbn      = {0-7695-2701-9},
  doi       = {10.1109/ICDM.2006.126},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}

@inproceedings{li2004cmt,
  author    = {Li, Z. and Lu, S. and Myagmar, S. and Zhou, Y.},
  title     = {{CP-Miner}: A tool for finding copy-paste and
               related bugs in operating system code},
  booktitle = {Proceedings of the Sixth Symposium on Operating
               System Design and Implementation},
  pages     = {289--302},
  year      = {2004}
}

% Third author uses the "Last, Jr., First" form so that "Jr." is parsed as
% the suffix rather than as part of the surname.
@inproceedings{kim2005fct,
  author    = {Kim, S. and Pan, K. and Whitehead, Jr., E. J.},
  title     = {When Functions Change Their Names: Automatic
               Detection of Origin Relationships},
  booktitle = {Reverse Engineering},
  pages     = {143--152},
  year      = {2005}
}

@inproceedings{segal2004sea,
  author    = {Segal, R. and Crawford, J. and Kephart, J. and
               Leiba, B.},
  title     = {{SpamGuru}: An Enterprise Anti-Spam Filtering
               System},
  booktitle = {Proceedings of the First Conference on E-mail and
               Anti-Spam},
  year      = {2004}
}

@inproceedings{winnowing,
  author    = {Schleimer, S. and Wilkerson, D. S. and Aiken, A.},
  title     = {{Winnowing}: local algorithms for document
               fingerprinting},
  booktitle = {SIGMOD'2003},
  pages     = {76--85},
  year      = {2003}
}

@article{hoover2001,
  author  = {David L. Hoover},
  title   = {Statistical Stylistics and Authorship Attribution:
             an Empirical Investigation},
  journal = llc,
  volume  = {16},
  number  = {4},
  pages   = {421--444},
  year    = {2001}
}

@inproceedings{Gibson2005,
  author    = {David Gibson and Kunal Punera and Andrew Tomkins},
  title     = {The volume and evolution of web page templates},
  booktitle = {WWW '05},
  pages     = {830--839},
  year      = {2005}
}

@inproceedings{511522,
  author    = {Ziv Bar-Yossef and Sridhar Rajagopalan},
  title     = {Template detection via data mining and its
               applications},
  booktitle = {WWW '02},
  pages     = {580--591},
  year      = {2002}
}

@inproceedings{1141534,
  author    = {Liang Chen and Shaozhi Ye and Xing Li},
  title     = {Template detection for large scale search engines},
  booktitle = {SAC '06},
  pages     = {1094--1098},
  year      = {2006}
}

@inproceedings{1067065,
  author    = {Sandip Debnath and Prasenjit Mitra and C. Lee Giles},
  title     = {Automatic extraction of informative blocks from
               webpages},
  booktitle = {SAC '05},
  pages     = {1722--1726},
  year      = {2005}
}

@inproceedings{ji2005mmd,
  author    = {Ji, X. and Bailey, J. and Dong, G.},
  title     = {Mining Minimal Distinguishing Subsequence Patterns
               with Gap Constraints},
  booktitle = {ICDM'05},
  pages     = {194--201},
  year      = {2005}
}

@misc{gute:2007newsletter5,
  author       = {Mike Cook},
  title        = {{Project Gutenberg} Weekly Newsletter --- Week
                  \#05-2007},
  howpublished = {online,
                  \url{http://www.gutenberg.org/newsletter/archive/PGWeekly_2007_02_07.txt}},
  year         = {2007},
  note         = {last checked 2007-02-27}
}

@inproceedings{dp2003,
  author    = {Newby, G. B. and Franks, C.},
  title     = {Distributed proofreading},
  booktitle = {Digital Libraries 2003},
  pages     = {27--31},
  year      = {2003}
}

% Author given name corrected from "Rober"; month uses the standard macro
% so that styles can localise or abbreviate it.
@misc{sort2005,
  author       = {Robert Ramey},
  title        = {2005 Performance/Price Sort and PennySort},
  howpublished = {online,
                  \url{http://research.microsoft.com/barc/SortBenchmark/2005_PostMansSort.pdf}},
  month        = apr,
  year         = {2005}
}

@inproceedings{1096605,
  author    = {H. D{\'e}jean and J.-L. Meunier},
  title     = {Structuring documents according to their table of
               contents},
  booktitle = {DocEng '05},
  pages     = {2--9},
  year      = {2005}
}

@article{DBLP:journals/ijdar/LinX06,
  author  = {X. Lin and Y. Xiong},
  title   = {Detection and analysis of table of contents based on
             content association},
  journal = {IJDAR},
  volume  = {8},
  number  = {2-3},
  pages   = {132--143},
  year    = {2006}
}

@article{taghva1996emb,
  author  = {Taghva, K. and Borsack, J. and Condit, A.},
  title   = {Evaluation of Model-Based Retrieval Effectiveness
             with {OCR} Text},
  journal = {ACM Transactions on Information Systems},
  volume  = {14},
  number  = {1},
  pages   = {64--93},
  year    = {1996}
}

@inproceedings{lin2006qah,
  author    = {Lin, X.},
  title     = {Quality Assurance in High Volume Document
               Digitization: A Survey},
  booktitle = {DIAL'06},
  pages     = {312--319},
  year      = {2006}
}

@inproceedings{aouicheiceis2007,
  author    = {K. Aouiche and D. Lemire},
  title     = {Unassuming View-Size Estimation Techniques in
               {OLAP}},
  booktitle = {ICEIS'07},
  pages     = {145--150},
  year      = {2007}
}

@book{grah:concrete,
  author    = {Ronald L. Graham and Donald E. Knuth and Oren
               Patashnik},
  title     = {Concrete Mathematics},
  publisher = {Addison-Wesley},
  year      = {1989}
}

@inproceedings{gol98met,
  author    = {Matteo Golfarelli and Stefano Rizzi},
  title     = {A Methodological Framework for Data Warehouse
               Design},
  booktitle = {DOLAP'98},
  pages     = {3--9},
  year      = {1998}
}

@article{car75ana,
  author  = {Alfonso F. Cardenas},
  title   = {Analysis and Performance of Inverted Data Base
             Structures},
  journal = {Communications of the {ACM}},
  volume  = {18},
  number  = {5},
  pages   = {253--263},
  year    = {1975}
}

@article{yao77app,
  author  = {S. B. Yao},
  title   = {Approximating Block Accesses in Database
             Organizations},
  journal = {Communications of the {ACM}},
  volume  = {20},
  number  = {4},
  pages   = {260--261},
  year    = {1977}
}

@article{transpos2005,
  author  = {J. Gray},
  title   = {A Measure of Transaction Processing -- 20 Years
             Later},
  journal = {IEEE Data Engineering Bulletin},
  year    = {2005}
}

@inproceedings{gup97sel,
  author    = {Himanshu Gupta},
  title     = {Selection of Views to Materialize in a Data
               Warehouse},
  booktitle = {{ICDT'97}},
  pages     = {98--112},
  year      = {1997}
}

@misc{DBGEN,
  author       = {{Transaction Processing Performance Council}},
  title        = {{DBGEN} 2.4.0},
  howpublished = {\url{http://www.tpc.org/tpch/} (Last checked 07-29-2009)},
  year         = {2006},
  removedurl   = {{http://www.tpc.org/tpch/}}
}


@misc{DBGEN---fr,
  author       = {{TPC}},
  title        = {{DBGEN} 2.4.0},
  howpublished = {En ligne~: \url{http://www.tpc.org/tpch/}},
  year         = {2006},
  note         = {Dernier acc\`es le 4 d\'ecembre 2007},
  institution  = {Transaction Processing Performance Council},
  removedurl   = {{http://www.tpc.org/tpch/}}
}

@misc{KDDRepository,
  author       = {S. Hettich and S. D. Bay},
  title        = {The {UCI} {KDD} archive},
  howpublished = {\url{http://kdd.ics.uci.edu} (Last checked 06-09-2010)},
  year         = {2000},
  institution  = {University of California, Irvine}
}



@misc{KDDRepository---fr,
  author       = {S. Hettich and S. D. Bay},
  title        = {The {UCI} {KDD} archive},
  howpublished = {En ligne~: \url{http://kdd.ics.uci.edu}},
  year         = {2000},
  note         = {Dernier acc\`es le 21 d\'ecembre 2007},
  institution  = {University of California, Irvine}
}

@inproceedings{adbis06ajd,
  author    = {K. Aouiche and P. Jouve and J. Darmont},
  title     = {Clustering-Based Materialized View Selection in Data
               Warehouses},
  booktitle = {ADBIS'06},
  series    = {LNCS},
  volume    = {4152},
  pages     = {81--95},
  year      = {2006}
}

@inproceedings{237823,
  author    = {N. Alon and Y. Matias and M. Szegedy},
  title     = {The space complexity of approximating the frequency
               moments},
  booktitle = {STOC '96},
  pages     = {20--29},
  year      = {1996}
}

@inproceedings{cormode2005sam,
  author    = {Cormode, G. and Muthukrishnan, S.},
  title     = {Summarizing and mining skewed data streams},
  booktitle = {SDM'05},
  year      = {2005}
}

@inproceedings{manku2002afc,
  author    = {Manku, G. S. and Motwani, R.},
  title     = {Approximate frequency counts over data streams},
  booktitle = {VLDB'02},
  pages     = {346--357},
  year      = {2002}
}

@inproceedings{wu2007,
  author    = {Ping Wu and Yannis Sismanis and Berthold Reinwald},
  title     = {Towards Keyword-Driven Analytical Processing},
  booktitle = {SIGMOD '07},
  pages     = {617--628},
  year      = {2007}
}

@inproceedings{halv:tag-presentation-assessment,
  author    = {Martin Halvey and Mark T. Keane},
  title     = {An Assessment of Tag Presentation Techniques},
  booktitle = {Proceedings, WWW 2007},
  year      = {2007}
}

@inproceedings{1240781,
  author    = {Jeffrey Heer and Fernanda B. Vi{\'e}gas and Martin
               Wattenberg},
  title     = {Voyagers and voyeurs: supporting asynchronous
               collaborative information visualization},
  booktitle = {CHI '07},
  pages     = {1029--1038},
  year      = {2007}
}

% Author list repaired: the original contained "and and", which BibTeX
% parses as an extra, empty author.
@inproceedings{manyeyes2008,
  author    = {F. B. Vi{\'e}gas and M. Wattenberg and M. McKeon and
               F. van Ham and J. Kriss},
  title     = {Harry Potter and the meat-filled freezer: A case study
               of spontaneous usage of visualization tools},
  booktitle = {HICSS 2008},
  pages     = {1--10},
  year      = {2008}
}

@article{wattenberg2006dsd,
  author  = {Wattenberg, M. and Kriss, J.},
  title   = {Designing for Social Data Analysis},
  journal = {IEEE Transactions on Visualization and Computer
             Graphics},
  volume  = {12},
  number  = {4},
  pages   = {549--557},
  year    = {2006}
}

@inproceedings{583891,
  author    = {Mathurin Body and Maryvonne Miquel and Yvan B{\'e}dard
               and Anne Tchounikine},
  title     = {A multidimensional and multiversion structure for
               {OLAP} applications},
  booktitle = {DOLAP '02},
  pages     = {1--6},
  year      = {2002}
}

@inproceedings{morzy2004qvm,
  author    = {Morzy, T. and Wrembel, R.},
  title     = {On querying versions of multiversion data warehouse},
  booktitle = {DOLAP '04},
  pages     = {92--101},
  year      = {2004}
}

@inproceedings{kaser2007,
  author    = {Owen Kaser and Daniel Lemire},
  title     = {Tag-Cloud Drawing: Algorithms for Cloud
               Visualization},
  booktitle = {WWW 2007 -- Tagging and Metadata for Social
               Information Organization},
  year      = {2007}
}

@comment{http://www.infoworld.com/article/03/06/02/22NNbi_1.html}
@article{Havenstein2003,
  author  = {Heather Havenstein},
  title   = {{BI} vendors seek to tap end-user power: New class
             of tools built to reap user knowledge for
             customizing analytic applications},
  journal = {InfoWorld},
  volume  = {22},
  pages   = {20--21},
  year    = {2003}
}

% Venue acronym corrected from "SSDM" to "SSDBM" (Scientific and Statistical
% Database Management); stray leading blank removed from the title.
@inproceedings{xmlolap,
  author    = {Pedersen, D. and Riis, K. and Pedersen, T. B.},
  title     = {{XML}-extended {OLAP} querying},
  booktitle = {SSDBM 2002},
  pages     = {195--206},
  year      = {2002}
}

@inproceedings{veltkamp2001sms,
  author    = {Veltkamp, R. C.},
  title     = {Shape matching: similarity measures and algorithms},
  booktitle = {SMI 2001},
  pages     = {188--197},
  year      = {2001}
}

@inproceedings{hdimolap,
  author    = {Xiaolei Li and Jiawei Han and Hector Gonzalez},
  title     = {High-Dimensional {OLAP}: A Minimal Cubing Approach},
  booktitle = {VLDB'04},
  year      = {2004},
  url       = {http://www.cs.uiuc.edu/~hanj/pdf/vldb04_hdolap.pdf}
}

@inproceedings{DBLP:conf/vldb/BurdickDJRV05,
  author    = {Douglas Burdick and Prasad Deshpande and
               T. S. Jayram and Raghu Ramakrishnan and Shivakumar
               Vaithyanathan},
  title     = {{OLAP} Over Uncertain and Imprecise Data},
  booktitle = {VLDB'05},
  pages     = {970--981},
  year      = {2005},
  url       = {http://www.vldb2005.org/program/paper/fri/p970-burdick.pdf},
  obsolete  = {see burd:olap-imprecise-vldbj}
}


@article{burd:olap-imprecise-vldbj,
  author  = {Douglas Burdick and Prasad Deshpande and
             T. S. Jayram and Raghu Ramakrishnan and Shivakumar
             Vaithyanathan},
  title   = {{OLAP} Over Uncertain and Imprecise Data},
  journal = {The {VLDB} J.},
  volume  = {16},
  number  = {1},
  pages   = {123--144},
  year    = {2007}
}

@article{1093388,
  author    = {Hurtado, Carlos A. and Gutierrez, Claudio and Mendelzon, Alberto O.},
  title     = {Capturing summarizability with integrity constraints in {OLAP}},
  journal   = {ACM Trans. Database Syst.},
  volume    = {30},
  number    = {3},
  pages     = {854--886},
  year      = {2005},
  issn      = {0362-5915},
  doi       = {10.1145/1093382.1093388},
  publisher = {ACM},
  address   = {New York, NY, USA}
}

@inproceedings{wong1985btf,
  author    = {Wong, H. K. T. and Liu, H. F. and Olken, F. and Rotem,
               D. and Wong, L.},
  title     = {Bit transposed files},
  booktitle = {VLDB '85},
  pages     = {448--457},
  year      = {1985}
}

@inproceedings{chan1999ebe,
  author    = {Chan, C. Y. and Ioannidis, Y. E.},
  title     = {An efficient bitmap encoding scheme for selection
               queries},
  booktitle = {SIGMOD'99},
  pages     = {215--226},
  year      = {1999}
}

@inproceedings{354819,
  author    = {Nick Koudas},
  title     = {Space efficient bitmap indexing},
  booktitle = {CIKM '00},
  pages     = {194--201},
  year      = {2000},
  isbn      = {1-58113-320-0}
}

@inproceedings{1155030,
  author    = {Doron Rotem and Kurt Stockinger and Kesheng Wu},
  title     = {Minimizing {I/O} Costs of Multi-Dimensional Queries
               with Bitmap Indices},
  booktitle = {SSDBM '06},
  pages     = {33--44},
  year      = {2006},
  isbn      = {0-7695-2590-3}
}

@inproceedings{webb2007,
  author    = {Hazel Webb},
  title     = {Properties and Applications of Diamond Cubes},
  booktitle = {ICSOFT 2007 -- Doctoral Consortium},
  year      = {2007}
}

% The standard styles require a note for unpublished entries; a neutral one
% is supplied here. NOTE(review): replace it with the actual status or venue
% if the manuscript has since appeared.
@unpublished{webb2010,
  author = {Hazel Webb and Owen Kaser and Daniel Lemire},
  title  = {Evaluating Multidimensional Queries by Diamond Dicing},
  note   = {Unpublished manuscript},
  year   = {2010}
}


% Author names restored to their accented and hyphenated forms.
@article{jurgens2001tbi,
  author  = {J{\"u}rgens, M. and Lenz, H.-J.},
  title   = {Tree Based Indexes Versus Bitmap Indexes: A
             Performance Study},
  journal = {International Journal of Cooperative Information
             Systems},
  volume  = {10},
  number  = {3},
  pages   = {355--376},
  year    = {2001}
}

@inproceedings{cai2005fat,
  author    = {Min Cai and Jianping Pan and Yu-Kwong Kwok and Kai
               Hwang},
  title     = {Fast and accurate traffic matrix measurement using
               adaptive cardinality counting},
  booktitle = {{MineNet}'05},
  pages     = {205--206},
  year      = {2005}
}

@article{whang1990lin,
  author  = {Kyu-Young Whang and Brad T. Vander-Zanden and Howard
             M. Taylor},
  title   = {A linear-time probabilistic counting algorithm for
             database applications},
  journal = {ACM Trans. Database Syst.},
  volume  = {15},
  number  = {2},
  pages   = {208--229},
  year    = {1990}
}

@article{alon1986,
  author  = {N. Alon and L. Babai and A. Itai},
  title   = {A fast and simple randomized parallel algorithm for
             the maximal independent set problem},
  journal = {J. Algorithms},
  volume  = {7},
  number  = {4},
  pages   = {567--583},
  year    = {1986}
}

@inproceedings{paquet2004tsi,
  author    = {Paquet, S. and Pearson, P.},
  title     = {Topic sharing infrastructure for weblog networks},
  booktitle = {CNSR 2004},
  pages     = {301--304},
  year      = {2004}
}

@inproceedings{morzy2003hbi,
  author    = {Morzy, M. and Morzy, T. and Nanopoulos, A. and
               Manolopoulos, Y.},
  title     = {Hierarchical Bitmap Index: An Efficient and Scalable
               Indexing Technique for Set-Valued Attributes},
  booktitle = {ADBIS 2003},
  year      = {2003}
}

@inproceedings{DBLP:conf/vldb/BurdickDJRV06,
  author    = {Douglas Burdick and Prasad M. Deshpande and
               T. S. Jayram and Raghu Ramakrishnan and Shivakumar
               Vaithyanathan},
  title     = {Efficient Allocation Algorithms for {OLAP} Over
               Imprecise Data},
  booktitle = {VLDB'06},
  pages     = {391--402},
  year      = {2006},
  ee        = {http://www.vldb.org/conf/2006/p391-burdick.pdf},
  crossref  = {DBLP:conf/vldb/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@article{Loevinger,
  author  = {Loevinger, J.},
  title   = {A systematic approach to the construction and evaluation of tests of ability},
  journal = {Psychological Monographs},
  volume  = {61},
  number  = {4},
  year    = {1947}
}

@inproceedings{brin97beyond,
  author    = {Sergey Brin and Rajeev Motwani and Craig Silverstein},
  editor    = {Joan Peckham},
  title     = {Beyond Market Baskets: Generalizing Association Rules to Correlations},
  booktitle = {SIGMOD 1997},
  publisher = {ACM Press},
  pages     = {265--276},
  year      = {1997}
}

  @misc{dataminer,
    author       = {{IBM}},
    title        = {{DB2} Intelligent Miner},
    howpublished = {\url{http://www-306.ibm.com/software/data/iminer/} (Last checked 07-29-2009)}
  }

@inproceedings{DBLP:conf/vldb/0003RBCY06,
  author    = {Lei Chen and Raghu Ramakrishnan and Paul Barford and
               Bee-Chung Chen and Vinod Yegneswaran},
  title     = {Composite Subset Measures},
  booktitle = {VLDB'06},
  pages     = {403--414},
  year      = {2006},
  ee        = {http://www.vldb.org/conf/2006/p403-chen.pdf},
  crossref  = {DBLP:conf/vldb/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{DBLP:conf/vldb/JiTT06,
  author    = {Liping Ji and Kian-Lee Tan and Anthony K. H. Tung},
  title     = {Mining Frequent Closed Cubes in 3D Datasets},
  booktitle = {VLDB'06},
  pages     = {811--822},
  year      = {2006},
  ee        = {http://www.vldb.org/conf/2006/p811-ji.pdf},
  crossref  = {DBLP:conf/vldb/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de},
  hidden    = {not in hazel course}
}

@proceedings{DBLP:conf/vldb/2006,
  editor    = {Umeshwar Dayal and Kyu-Young Whang and David
               B. Lomet and Gustavo Alonso and Guy M. Lohman and
               Martin L. Kersten and Sang Kyun Cha and Young-Kuk
               Kim},
  title     = {Proceedings of the 32nd International Conference on
               Very Large Data Bases, Seoul, Korea, September
               12-15, 2006},
  booktitle = {VLDB'06},
  publisher = {ACM},
  year      = {2006},
  isbn      = {1-59593-385-9},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{binn:reverse-query-processing,
  author    = {Carsten Binnig and Donald Kossmann and Eric Lo},
  title     = {Reverse Query Processing},
  booktitle = {IEEE 23rd International Conference on Data
               Engineering},
  pages     = {506--515},
  year      = {2007}
}


@inproceedings{956064,
  author    = {Yannis Sismanis and Antonios Deligiannakis and
               Yannis Kotidis and Nick Roussopoulos},
  title     = {Hierarchical dwarfs for the rollup cube},
  booktitle = {DOLAP '03: Proceedings of the 6th ACM international
               workshop on Data warehousing and OLAP},
  pages     = {17--24},
  year      = {2003},
  isbn      = {1-58113-727-3},
  location  = {New Orleans, Louisiana, USA},
  doi       = {10.1145/956060.956064},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{564745,
  author    = {Yannis Sismanis and Antonios Deligiannakis and Nick
               Roussopoulos and Yannis Kotidis},
  title     = {Dwarf: shrinking the {PetaCube}},
  booktitle = {SIGMOD '02: Proceedings of the 2002 ACM SIGMOD
               international conference on Management of data},
  pages     = {464--475},
  year      = {2002},
  isbn      = {1-58113-497-5},
  location  = {Madison, Wisconsin},
  doi       = {10.1145/564691.564745},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{1031771,
  author    = {Jianlin Feng and Qiong Fang and Hulin Ding},
  title     = {{PrefixCube}: Prefix-sharing Condensed Data Cube},
  booktitle = {DOLAP '04},
  pages     = {38--47},
  year      = {2004},
  isbn      = {1-58113-977-2},
  location  = {Washington, DC, USA},
  doi       = {10.1145/1031763.1031771},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@inproceedings{879029,
  author    = {W. Wang and J. Feng and H. Lu and J. X. Yu},
  title     = {Condensed Cube: An Efficient Approach to Reducing
               Data Cube Size},
  booktitle = {ICDE '02},
  pages     = {155},
  year      = {2002},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}

@proceedings{DBLP:conf/waim/2001,
  editor    = {Xiaoyang Sean Wang and Ge Yu and Hongjun Lu},
  title     = {Advances in Web-Age Information Management, Second
               International Conference, WAIM 2001, Xi'an, China,
               July 9-11, 2001, Proceedings},
  booktitle = {WAIM},
  series    = {Lecture Notes in Computer Science},
  volume    = {2118},
  publisher = {Springer},
  year      = {2001},
  isbn      = {3-540-42298-6},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@misc{SAS,
  author       = {{SAS}},
  title        = {Data Mining with {SAS} {Enterprise Miner}},
  howpublished = {\url{http://www.sas.com/technologies/analytics/datamining/miner/#section=3}},
  note         = {(Last checked 07-29-2009)}
}
@inproceedings{BarbaraW01,
  author    = {Daniel Barbar{\'a} and Xintao Wu},
  title     = {Finding Dense Clusters in Hyperspace: An Approach
               Based on Row Shuffling},
  booktitle = {Advances in Web-age Information Management},
  pages     = {305--316},
  year      = {2001},
  ee        = {http://link.springer.de/link/service/series/0558/bibs/2118/21180305.htm},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{DBLP:conf/dawak/Lee06,
  author    = {Seok-Lyong Lee},
  title     = {An Effective Algorithm to Extract Dense Sub-cubes
               from a Large Sparse Cube},
  booktitle = {DaWaK},
  pages     = {155--164},
  year      = {2006},
  ee        = {http://dx.doi.org/10.1007/11823728_15},
  crossref  = {DBLP:conf/dawak/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@proceedings{DBLP:conf/dawak/2006,
  editor    = {A. Min Tjoa and Juan Trujillo},
  title     = {Data Warehousing and Knowledge Discovery, 8th
               International Conference, DaWaK 2006, Krakow,
               Poland, September 4-8, 2006, Proceedings},
  booktitle = {DaWaK},
  series    = {Lecture Notes in Computer Science},
  volume    = {4081},
  publisher = {Springer},
  year      = {2006},
  isbn      = {3-540-37736-0},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{1150484,
  author    = {Riadh {Ben Messaoud} and Omar Boussaid and Sabine
               {Loudcher Rabas{\'e}da}},
  title     = {Efficient Multidimensional Data Representations Based
               on Multiple Correspondence Analysis},
  booktitle = {KDD'06},
  pages     = {662--667},
  year      = {2006},
  isbn      = {1-59593-339-5}
}

@proceedings{DBLP:conf/kdd/2006,
  editor    = {Tina Eliassi-Rad and Lyle H. Ungar and Mark Craven
               and Dimitrios Gunopulos},
  title     = {Proceedings of the Twelfth ACM SIGKDD International
               Conference on Knowledge Discovery and Data Mining,
               Philadelphia, PA, USA, August 20-23, 2006},
  booktitle = {KDD},
  publisher = {ACM},
  year      = {2006},
  isbn      = {1-59593-339-5},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{1183678,
  author    = {Amit A. Nanavati and Siva Gurumurthy and Gautam Das
               and Dipanjan Chakraborty and Koustuv Dasgupta and
               Sougata Mukherjea and Anupam Joshi},
  title     = {On the structural properties of massive telecom call
               graphs: findings and implications},
  booktitle = {CIKM '06: Proceedings of the 15th ACM international
               conference on Information and knowledge management},
  pages     = {435--444},
  year      = {2006},
  isbn      = {1-59593-433-2},
  location  = {Arlington, Virginia, USA},
  doi       = {10.1145/1183614.1183678},
  publisher = {ACM Press},
  address   = {New York, NY, USA}
}

@article{1107340,
  author    = {Philip H. P. Nguyen and Dan Corbett},
  title     = {A Basic Mathematical Framework for Conceptual
               Graphs},
  journal   = {IEEE Transactions on Knowledge and Data Engineering},
  volume    = {18},
  number    = {2},
  pages     = {261--271},
  year      = {2006},
  issn      = {1041-4347},
  doi       = {10.1109/TKDE.2006.18},
  publisher = {IEEE Educational Activities Department},
  address   = {Piscataway, NJ, USA}
}

@article{godin95incremental,
  author      = {Robert Godin and Rokia Missaoui and Hassan Alaoui},
  title       = {Incremental concept formation algorithms based on
                 {Galois} (concept) lattices},
  journal     = {Computational Intelligence},
  volume      = {11},
  pages       = {246--267},
  year        = {1995},
  publisher   = {Blackwell Publishing},
  maybeEditor = {Randy Goebel and Russell Greiner and Dekang Lin},
  comment     = {DEPRECATED DUPLICATE ENTRY, USE THE DBLP ONE BELOW}
}

@article{DBLP:journals/ci/GodinMA95,
  author    = {Robert Godin and Rokia Missaoui and Hassan Alaoui},
  title     = {Incremental Concept Formation Algorithms Based on
               {Galois} (Concept) Lattices},
  journal   = {Computational Intelligence},
  volume    = {11},
  pages     = {246--267},
  year      = {1995},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{874730,
  author    = {G. Antoshenkov},
  title     = {Byte-Aligned Bitmap Compression},
  booktitle = {DCC'95},
  pages     = {476},
  year      = {1995},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}

@inproceedings{pinar05,
  author    = {A. Pinar and T. Tao and H. Ferhatosmanoglu},
  title     = {Compressing Bitmap Indices by Data Reorganization},
  booktitle = {ICDE'05},
  pages     = {310--321},
  year      = {2005},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}
@techreport{cascon2007techreport,
  author      = {Owen Kaser and Daniel Lemire},
  title       = {Removing Manually Generated Boilerplate from
                 Electronic Texts: Experiments with {Project
                 Gutenberg} e-Books},
  institution = {Dept. of CSAS, UNBSJ},
  number      = {TR-07-001},
  year        = {2007},
  note        = {available from \url{http://arxiv.org/abs/0707.1913}}
}

@inproceedings{kase:cascon07,
  author    = {Owen Kaser and Daniel Lemire},
  title     = {Removing Manually Generated Boilerplate from
               Electronic Texts: Experiments with {Project
               Gutenberg} e-Books},
  booktitle = {CASCON'07},
  pages     = {272--275},
  year      = {2007}
}

@inproceedings{klink:bav,
  author    = {Klink, S. and Ley, M. and Rabbidge, E. and Reuther,
               P. and Walter, B. and Weber, A.},
  title     = {Browsing and visualizing digital bibliographic data},
  booktitle = {VisSym 2004},
  pages     = {19--21},
  year      = {2004}
}

@article{pqtrees,
  author  = {Booth, Kellogg S. and Lueker, George S.},
  title   = {Testing for the Consecutive Ones Property, Interval
             Graphs, and Graph Planarity Using {PQ}-Tree
             Algorithms},
  journal = {Journal of Computer and System Sciences},
  volume  = {13},
  pages   = {335--379},
  year    = {1976}
}

@inproceedings{johnson2004clb,
  author    = {Johnson, D. S. and Krishnan, S. and Chhugani, J. and
               Kumar, S. and Venkatasubramanian, S.},
  title     = {Compressing Large Boolean Matrices Using Reordering
               Techniques},
  booktitle = {VLDB'04},
  pages     = {13--23},
  year      = {2004},
  publisher = {VLDB Endowment},
  address   = {San Jose, CA, USA}
}

@article{bhasker1987ola,
  author  = {Bhasker, J. and Sahni, S.},
  title   = {Optimal Linear Arrangement of Circuit Components},
  journal = {J. VLSI Comp. Syst.},
  volume  = {2},
  number  = {1},
  pages   = {87--109},
  year    = {1987}
}

@inproceedings{1164200,
  author    = {Tan Apaydin and Guadalupe Canahuate and Hakan
               Ferhatosmanoglu and Ali Saman Tosun},
  title     = {Approximate encoding for direct access and query
               processing over compressed bitmaps},
  booktitle = {VLDB '06},
  pages     = {846--857},
  year      = {2006}
}

@inproceedings{stockinger2004esb,
  author    = {Stockinger, K. and Wu, K. and Shoshani, A.},
  title     = {Evaluation Strategies for Bitmap Indices with
               Binning},
  booktitle = {{DEXA} '04},
  year      = {2004}
}

@inproceedings{671192,
  author    = {Roger Weber and Hans-J{\"o}rg Schek and Stephen
               Blott},
  title     = {A Quantitative Analysis and Performance Study for
               Similarity-Search Methods in High-Dimensional
               Spaces},
  booktitle = {VLDB '98},
  year      = {1998},
  pages     = {194--205}
}

@misc{WuPatent2004,
  author       = {K. Wu and A. Shoshani and E. J. Otoo},
  title        = {Word aligned bitmap compression method, data
                  structure, and apparatus},
  year         = {2004},
  howpublished = {US Patent Number 6,831,575}
}

% NOTE(review): the record below has no leading at-sign, so BibTeX treats it
% as ignored text and the key ley2002dcs cannot be cited from this record.
% Presumably it was disabled on purpose (e.g. to avoid a duplicate key) --
% confirm before restoring the marker.
inproceedings{ley2002dcs,
  title="The {DBLP} Computer Science Bibliography: Evolution, Research Issues, Perspectives",
  author="Ley, M.",
  booktitle="9th International Symposium on String Processing and Information Retrieval",
  pages="1--10",
  year="2002",
  publisher={Springer}
}
@article{1083791,
  author  = {Ergin Elmacioglu and Dongwon Lee},
  title   = {On six degrees of separation in {DBLP-DB} and more},
  journal = {SIGMOD Record},
  volume  = {34},
  number  = {2},
  pages   = {33--40},
  year    = {2005}
}

@inproceedings{878975,
  author    = {Low, Wai Lup and Tok, Wee Hyong and Lee, Mong Li and Ling, Tok Wang},
  title     = {Data Cleaning and {XML}: The {DBLP} Experience},
  booktitle = {ICDE '02},
  year      = {2002},
  pages     = {269}
}

@inproceedings{649755,
  author    = {Qiming Chen and Umeshwar Dayal and Meichun Hsu},
  title     = {{OLAP}-Based Data Mining for Business Intelligence
               Applications in Telecommunications and E-commerce},
  booktitle = {DNIS '00},
  pages     = {1--19},
  year      = {2000},
  isbn      = {3-540-41395-2}
}

@article{jaccard1912dfa,
  author  = {Jaccard, P.},
  title   = {The Distribution of the Flora in the Alpine Zone},
  journal = {New Phytologist},
  volume  = {11},
  number  = {2},
  pages   = {37--50},
  year    = {1912}
}

@article{chazelle1988fad,
  author  = {Chazelle, B.},
  title   = {A Functional Approach to Data Structures and Its Use
             in Multidimensional Searching},
  journal = {SIAM J. Comput.},
  volume  = {17},
  number  = {3},
  pages   = {427--462},
  year    = {1988}
}

@inproceedings{donjerkovic1999pot,
  author    = {Donjerkovic, D. and Ramakrishnan, R.},
  title     = {Probabilistic Optimization of Top N Queries},
  booktitle = {VLDB'99},
  year      = {1999},
  pages     = {411--422}
}

@inproceedings{253302,
  author    = {Michael J. Carey and Donald Kossmann},
  title     = {On Saying ``Enough already!'' in {SQL}},
  booktitle = {SIGMOD'97},
  pages     = {219--230},
  year      = {1997},
  isbn      = {0-89791-911-4}
}

@inproceedings{luo2001rtb,
  author    = {Luo, Z. W. and Ling, T. W. and Ang, C. H. and Lee,
               S. Y. and Cui, B.},
  title     = {Range Top/Bottom k Queries in {OLAP} Sparse Data
               Cubes},
  booktitle = {DEXA'01},
  year      = {2001},
  pages     = {678--687}
}

@inproceedings{loh2002amr,
  author    = {Loh, Z. X. and Ling, T. W. and Ang, C. H. and Lee,
               S. Y.},
  title     = {Adaptive Method for Range Top-k Queries in {OLAP}
               Data Cubes},
  booktitle = {DEXA'02},
  year      = {2002},
  pages     = {648--657}
}

@inproceedings{584806,
  author    = {Zheng Xuan Loh and Tok Wang Ling and Chuan Heng Ang
               and Sin Yeung Lee},
  title     = {Analysis of Pre-computed Partition Top Method for
               Range Top-k Queries in {OLAP} Data Cubes},
  booktitle = {CIKM'02},
  pages     = {60--67},
  year      = {2002}
}

@article{chung2007erm,
  author    = {Chung, Y. D. and Yang, W. S. and Kim, M. H.},
  title     = {An efficient, robust method for processing of
               partial top-k/bottom-k queries using the {RD}-Tree
               in {OLAP}},
  journal   = {Decision Support Systems},
  volume    = {43},
  number    = {2},
  pages     = {313--321},
  year      = {2007},
  publisher = {Elsevier}
}

@article{seokjin:eer,
  author  = {Hong, Seokjin and Moon, Bongki and Lee, Sukho},
  title   = {Efficient Execution of Range Top-k Queries in
             Aggregate {R-Trees}},
  journal = {IEICE -- Transactions on Information and Systems},
  volume  = {E88-D},
  number  = {11},
  pages   = {2544--2554},
  year    = {2005},
  issn    = {0916-8532}
}

@inproceedings{564729,
  author    = {Arjen P. de Vries and Nikos Mamoulis and Niels Nes
               and Martin Kersten},
  title     = {Efficient {k-NN} search on vertically decomposed
               data},
  booktitle = {SIGMOD'02},
  pages     = {322--333},
  year      = {2002}
}

@inproceedings{DBLP:conf/icde/BorzsonyiKS01,
  author    = {Stephan B{\"o}rzs{\"o}nyi and Donald Kossmann and
               Konrad Stocker},
  title     = {The Skyline Operator},
  booktitle = {ICDE '01},
  year      = {2001},
  pages     = {421--430},
  ee        = {http://doi.ieeecomputersociety.org/10.1109/ICDE.2001.914855},
  crossref  = {DBLP:conf/icde/2001},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@proceedings{DBLP:conf/icde/2001,
  title     = {Proceedings of the 17th International Conference on
               Data Engineering, April 2-6, 2001, Heidelberg,
               Germany},
  year      = {2001},
  publisher = {IEEE Computer Society},
  isbn      = {0-7695-1001-9},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{DBLP:conf/vldb/YiuM07,
  author    = {Man Lung Yiu and
               Nikos Mamoulis},
  title     = {Efficient Processing of Top-k Dominating Queries on Multi-Dimensional
               Data},
  booktitle = {VLDB'07},
  year      = {2007},
  pages     = {483--494},
  ee        = {http://www.vldb.org/conf/2007/papers/research/p483-yiu.pdf},
  renamedcrossref  = {DBLP:conf/vldb/2007},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{DBLP:conf/vldb/MorsePJ07,
  author    = {Michael D. Morse and
               Jignesh M. Patel and
               H. V. Jagadish},
  title     = {Efficient Skyline Computation over Low-Cardinality Domains},
  booktitle = {VLDB'07},
  year      = {2007},
  pages     = {267--278},
  ee        = {http://www.vldb.org/conf/2007/papers/research/p267-morse.pdf},
  renamedcrossref  = {DBLP:conf/vldb/2007},
  bibsource = {DBLP, http://dblp.uni-trier.de}
}

@inproceedings{lang:finding-markets,
  author    = {Kevin Lang and Reid Andersen},
  title     = {Finding dense and isolated submarkets in a sponsored
               search spending graph},
  booktitle = {CIKM},
  year      = {2007},
  note      = {to appear}
}

@inproceedings{1240775,
  author    = {A. W. Rivadeneira and Daniel M. Gruen and Michael J. Muller and David R. Millen},
  title     = {Getting our head in the clouds: toward evaluation studies of tagclouds},
  booktitle = {CHI'07},
  pages     = {995--998},
  year      = {2007},
  isbn      = {978-1-59593-593-9}
}

@article{kern:KL,
  author  = {Brian W. Kernighan and S. Lin},
  title   = {An Efficient Heuristic Procedure for Partitioning Graphs},
  journal = {Bell System Technical Journal},
  volume  = {49},
  number  = {2},
  pages   = {291--308},
  year    = {1970}
}

@misc{pref:fdl-class,
  author       = {{Prefuse Project}},
  title        = {Class {ForceDirectedLayout}},
  howpublished = {online, \url{http://prefuse.org/doc/api/prefuse/action/layout/graph/ForceDirectedLayout.html}},
  year         = {2006},
  month        = jul,
  note         = {checked 21 Sept 2007}
}

@inproceedings{ames:why-we-tag,
  author    = {Morgan Ames and Mor Naaman},
  title     = {Why We Tag: Motivations for Annotation in Mobile and Online Media},
  booktitle = {Proceedings, SIGCHI 2007},
  year      = {2007},
  pages     = {971--980}
}

@article{1232252,
  author  = {Uriel Feige and James R. Lee},
  title   = {An improved approximation ratio for the minimum linear arrangement problem},
  journal = {Inf. Process. Lett.},
  year    = {2007},
  volume  = {101},
  number  = {1},
  pages   = {26--29}
}

@inproceedings{suzuki2005dsp,
  author    = {Suzuki, A. and Tokuyama, T.},
  title     = {Dense Subgraph Problem Revisited},
  booktitle = {Joint Workshop ``New Horizons in Computing'' and ``Statistical Mechanical Approach to Probabilistic Information Processing''},
  year      = {2005}
}

@inproceedings{suzuki2005dsp-b,
  author    = {Akiko Suzuki and Takeshi Tokuyama},
  title     = {Dense Subgraph Problems with Output-Density Conditions},
  booktitle = {Proceedings, ISAAC 2005 (LNCS 3827)},
  publisher = {Springer-Verlag},
  year      = {2005},
  pages     = {266--276}
}

@article{georgakopoulos2007mdr,
  author    = {Georgakopoulos, G. F. and Politopoulos, K.},
  title     = {{MAX-DENSITY} Revisited: a Generalization and a More Efficient Algorithm},
  journal   = {The Computer Journal},
  year      = {2007},
  volume    = {50},
  number    = {3},
  pages     = {348},
  publisher = {Br Computer Soc}
}

@article{gallo1989fpm,
  author    = {Gallo, G. and Grigoriadis, M. D. and Tarjan, R. E.},
  title     = {A Fast Parametric Maximum Flow Algorithm and Applications},
  journal   = {SIAM Journal on Computing},
  year      = {1989},
  volume    = {18},
  number    = {1},
  pages     = {30--55},
  publisher = {Society for Industrial and Applied Mathematics Philadelphia, PA, USA}
}

@article{asahiro2000gfd,
  author    = {Asahiro, Y. and Iwama, K. and Tamaki, H. and Tokuyama, T.},
  title     = {Greedily Finding a Dense Subgraph},
  journal   = {Journal of Algorithms},
  year      = {2000},
  volume    = {34},
  number    = {2},
  pages     = {203--221},
  publisher = {Elsevier}
}

@inproceedings{658338,
  author    = {Patrick E. O'Neil},
  title     = {Model 204 Architecture and Performance},
  booktitle = {2nd International Workshop on High Performance Transaction Systems},
  pages     = {40--59},
  year      = {1989},
  publisher = {Springer-Verlag},
  address   = {London, UK}
}


@article{Dawande2001,
  author  = {Milind Dawande and Pinar Keskinocak and Jayashankar M. Swaminathan and Sridhar Tayur},
  title   = {On Bipartite and Multipartite Clique Problems},
  journal = {Journal of Algorithms},
  volume  = {41},
  number  = {2},
  pages   = {388--403},
  month   = nov,
  year    = {2001}
}

@book{politis1999s,
  author    = {Politis, D. N. and Romano, J. P. and Wolf, M.},
  title     = {Subsampling},
  publisher = {Springer},
  year      = {1999}
}

@inproceedings{babcock2003dss,
  author    = {Babcock, B. and Chaudhuri, S. and Das, G.},
  title     = {Dynamic Sample Selection for Approximate Query Processing},
  booktitle = {SIGMOD'03},
  year      = {2003},
  pages     = {539--550}
}

@inproceedings{ganti2000ist,
  author    = {Ganti, V. and Lee, M. L. and Ramakrishnan, R.},
  title     = {{ICICLES}: Self-Tuning Samples for Approximate Query Answering},
  booktitle = {VLDB'00},
  year      = {2000},
  pages     = {176--187}
}
@inproceedings{133210,
  title     = {Parameterised compression for sparse bitmaps},
  author    = {Alistair Moffat and Justin Zobel},
  booktitle = {SIGIR'92},
  pages     = {274--285},
  year      = {1992}
}


    @inproceedings{313082,
      author    = {Ravi Kumar and Prabhakar Raghavan and Sridhar Rajagopalan and Andrew Tomkins},
      title     = {Trawling the {Web} for Emerging Cyber-communities},
      booktitle = {WWW '99},
      year      = {1999},
      pages     = {1481--1493},
      location  = {Toronto, Canada},
      doi       = {10.1016/S1389-1286(99)00040-7},
      publisher = {Elsevier North-Holland, Inc.},
      address   = {New York, NY, USA}
    }

@inproceedings{pens:fault-tol-fca,
  author    = {Pensa, Ruggero G. and Boulicaut, Jean-Fran{\c{c}}ois},
  title     = {Fault Tolerant Formal Concept Analysis},
  booktitle = {AI*IA 2005},
  series    = {LNAI},
  volume    = {3673},
  pages     = {212--233},
  publisher = {Springer-Verlag},
  year      = {2005}
}



@article{wattenhofer2004fas,
  author    = {Wattenhofer, M. and Wattenhofer, R.},
  title     = {Fast and Simple Algorithms for Weighted Perfect Matching},
  journal   = {Electronic Notes in Discrete Mathematics},
  year      = {2004},
  volume    = {17},
  pages     = {285--291},
  publisher = {Elsevier}
}

@article{kuhn2005hma,
  author  = {Kuhn, H. W.},
  title   = {The {Hungarian} method for the assignment problem},
  journal = {Naval Research Logistics},
  year    = {2005},
  volume  = {52},
  number  = {1},
  pages   = {7--21}
}
@misc{DBLPXML,
  author       = {Michael Ley},
  howpublished = {\url{http://dblp.uni-trier.de/xml/}},
  note         = {last checked March, 2008},
  year         = {2008}
}

@misc{DBLPXML---fr,
  author       = {Michael Ley},
  howpublished = {\url{http://dblp.uni-trier.de/xml/}},
  note         = {Dernier acc\`es en mars 2008},
  year         = {2008}
}
@misc{netflixprize,
  author       = {{Netflix, Inc.}},
  title        = {Netflix Prize},
  howpublished = {\url{http://www.netflixprize.com} (Last checked 06-09-2010)},
  year         = {2007}
}

@misc{netflixprize---fr,
  author       = {{Netflix, Inc.}},
  title        = {Netflix Prize},
  howpublished = {\url{http://www.netflixprize.com}},
  year         = {2007},
  note         = {Dernier acc\`es le 4 d\'ecembre 2007}
}
@misc{monashbigtera2007,
  author       = {Curt Monash},
  title        = {{DATAllegro} heads for the high end},
  howpublished = {\url{http://www.dbms2.com/2007/07/25/datallegro-heads-for-the-high-end/}},
  year         = {2007}
}



@inproceedings{reddy2001arw,
  author    = {Reddy, P. K. and Kitsuregawa, M.},
  title     = {An Approach to Relate the Web Communities through Bipartite Graphs},
  booktitle = {WISE'01},
  year      = {2001},
  pages     = {302--310}
}

@article{yang2005irw,
  author  = {Yang, K.},
  title   = {Information Retrieval on the Web},
  journal = {Annual Review of Information Science and Technology},
  year    = {2005},
  volume  = {39},
  pages   = {33--81}
}

@inproceedings{1142547,
  title     = {{DADA}: a Data Cube for Dominant Relationship Analysis},
  author    = {Cuiping Li and Beng Chin Ooi and Anthony K. H. Tung and Shan Wang},
  booktitle = {SIGMOD'06},
  pages     = {659--670},
  year      = {2006}
}

@inproceedings{DBLP:conf/sigmod/AgrawalGGR98,
  title     = {Automatic Subspace Clustering of High Dimensional Data for Data
               Mining Applications},
  author    = {Rakesh Agrawal and Johannes Gehrke and
               Dimitrios Gunopulos and Prabhakar Raghavan},
  booktitle = {SIGMOD'98},
  pages     = {94--105},
  year      = {1998}
}

@article{cheung2001tbd,
  author    = {Cheung, D. W. and Zhou, B. and Kao, B. and Kan, H. and Lee, S. D.},
  title     = {Towards the building of a dense-region-based {OLAP} system},
  journal   = {Data \& Knowledge Engineering},
  year      = {2001},
  volume    = {36},
  number    = {1},
  pages     = {1--27},
  publisher = {Elsevier}
}


@article{1348835,
  author    = {Terracina, G. and Leone, N. and Lio, V. and Panetta, C.},
  title     = {Experimenting with Recursive Queries in Database and Logic Programming Systems},
  journal   = {Theory and Practice of Logic Programming},
  volume    = {8},
  number    = {2},
  pages     = {129--165},
  year      = {2008},
  issn      = {1471-0684},
  doi       = {10.1017/S1471068407003158},
  publisher = {Cambridge University Press},
  address   = {New York, NY, USA}
}


@book{thom:OLAP-book,
  author    = {Erik Thomsen},
  title     = {{OLAP} Solutions: Building Multidimensional Information Systems},
  edition   = {Second},
  publisher = {Wiley},
  year      = {2002}
}


@inproceedings{1317339,
  author    = {Michal Stabno and Robert Wrembel},
  title     = {{RLH}: bitmap compression technique based on run-length and {Huffman} encoding},
  booktitle = {DOLAP '07: Proceedings of the ACM tenth international workshop on Data warehousing and OLAP},
  year      = {2007},
  isbn      = {978-1-59593-827-5},
  pages     = {41--48},
  location  = {Lisbon, Portugal},
  doi       = {10.1145/1317331.1317339},
  publisher = {ACM},
  address   = {New York, NY, USA}
}

 @inproceedings{1142476,
   author    = {Nicholas E. Taylor and Zachary G. Ives},
   title     = {Reconciling while tolerating disagreement in collaborative data sharing},
   booktitle = {SIGMOD '06},
   year      = {2006},
   isbn      = {1-59593-434-0},
   pages     = {13--24},
   location  = {Chicago, IL, USA},
   doi       = {10.1145/1142473.1142476},
   publisher = {ACM},
   address   = {New York, NY, USA}
 }

 @inproceedings{1247631,
   author    = {Todd J. Green and Grigoris Karvounarakis and Nicholas E. Taylor and Olivier Biton and Zachary G. Ives and Val Tannen},
   title     = {{ORCHESTRA}: facilitating collaborative data sharing},
   booktitle = {SIGMOD '07},
   year      = {2007},
   isbn      = {978-1-59593-686-8},
   pages     = {1131--1133},
   location  = {Beijing, China},
   doi       = {10.1145/1247480.1247631},
   publisher = {ACM},
   address   = {New York, NY, USA}
 }

 @inproceedings{wang2007wbc,
   author    = {Wang, F. and Rabsch, C. and Kling, P. and Liu, P. and Pearson, J.},
   title     = {Web-based Collaborative Information Integration for Scientific Research},
   booktitle = {ICDE 2007},
   year      = {2007},
   pages     = {1232--1241}
 }

@article{115366,
  author    = {Harold N. Gabow and Robert E. Tarjan},
  title     = {Faster scaling algorithms for general graph matching problems},
  journal   = {J. ACM},
  volume    = {38},
  number    = {4},
  pages     = {815--853},
  year      = {1991},
  issn      = {0004-5411},
  publisher = {ACM},
  address   = {New York, NY, USA}
}


@book{text-mining-handbook,
  author    = {Ronen Feldman and James Sanger},
  title     = {The Text Mining Handbook},
  year      = {2007},
  publisher = {Cambridge University Press},
  annote    = {references mostly till 2002}
}

@article{text-mining-survey-sigmod07,
  author  = {Anna Stavrianou and Periklis Andritsos and Nicolas
             Nicoloyannis},
  title   = {Overview and Semantic Issues of Text Mining},
  journal = {{SIGMOD} Record},
  volume  = {36},
  number  = {3},
  month   = sep,
  year    = {2007}
}

@article{schn:creativity-support-cacm,
  author  = {Ben Shneiderman},
  title   = {Creativity Support Tools},
  journal = cacm,
  volume  = {50},
  number  = {12},
  pages   = {20--32},
  month   = dec,
  year    = {2007}
}


@inproceedings{502689,
  title     = {A performance comparison of bitmap indexes},
  author    = {Kesheng Wu and Ekow J. Otoo and Arie Shoshani},
  booktitle = {CIKM '01},
  pages     = {559--561},
  year      = {2001}
}

 @inproceedings{671874,
   title     = {Optimizing Queries on Compressed Bitmaps},
   author    = {Sihem Amer-Yahia and Theodore Johnson},
   booktitle = {VLDB '00},
   pages     = {329--338},
   year      = {2000}
 }


 @article{48015,
   title   = {A new class of heuristic algorithms for weighted perfect matching},
   author  = {M. D. Grigoriadis and B. Kalantari},
   journal = {J. ACM},
   year    = {1988},
   volume  = {35},
   number  = {4},
   pages   = {769--776}
 }

 @article{imielinska1997gch,
   author  = {Imielinska, C.},
   title   = {A General Class of Heuristics for Minimum Weight Perfect Matching and Fast Special Cases with Doubly and Triply Logarithmic Errors},
   journal = {Algorithmica},
   year    = {1997},
   volume  = {18},
   number  = {4},
   pages   = {544--559}
 }

@inproceedings{oneil2007bid,
  author    = {O'Neil, E. and O'Neil, P. and Wu, K.},
  title     = {Bitmap Index Design Choices and Their Performance Implications},
  booktitle = {IDEAS 2007},
  year      = {2007},
  pages     = {72--84}
}

@inproceedings{1347164,
  title     = {Why simple hash functions work: exploiting the entropy in a data stream},
  author    = {Michael Mitzenmacher and Salil Vadhan},
  booktitle = {SODA '08},
  pages     = {746--755},
  year      = {2008}
}

@book{anderson2006lt,
  author    = {Anderson, C.},
  title     = {The Long Tail},
  publisher = {Hyperion},
  year      = {2006}
}


@article{yiannis2007ctf,
  author    = {Yiannis, J. and Zobel, J.},
  title     = {Compression techniques for fast external sorting},
  journal   = {The VLDB Journal},
  year      = {2007},
  volume    = {16},
  number    = {2},
  pages     = {269--291},
  publisher = {Springer}
}

@misc{xldb07---fr,
  author       = {J. Becla and K.-T. Lim},
  title        = {Report from the 1st Workshop on Extremely Large Databases},
  year         = {2007},
  howpublished = {En ligne~: \url{http://www-conf.slac.stanford.edu/xldb07/xldb07_report.pdf}},
  note         = {Dernier acc\`es le 22 avril 2008}
}
@misc{xldb07,
  author       = {J. Becla and K.-T. Lim},
  title        = {Report from the 1st Workshop on Extremely Large Databases},
  year         = {2007},
  howpublished = {online: \url{http://www-conf.slac.stanford.edu/xldb07/xldb07_report.pdf}}
}

@book{kimball1996dwt,
  author    = {Kimball, Ralph},
  title     = {The data warehouse toolkit: practical techniques for building dimensional data warehouses},
  publisher = {John Wiley \& Sons, Inc.},
  address   = {New York, NY, USA},
  year      = {1996}
}

@article{hammer2003cea,
  author    = {Hammer, J. and Fu, L.},
  title     = {{CubiST++}: Evaluating Ad-Hoc {CUBE} Queries Using Statistics Trees},
  journal   = {Distributed and Parallel Databases},
  year      = {2003},
  volume    = {14},
  number    = {3},
  pages     = {221--254},
  publisher = {Springer}
}

@Comment  article{bellatreche2007sap,
@Comment   title={Selection and Pruning Algorithms for Bitmap Index Selection Problem Using Data Mining},
@Comment   author={Bellatreche, L. and Missaoui, R. and Necir, H. and Drias, H.},
@Comment   journal={LNCS},
@Comment   volume={4654},
@Comment   pages={221},
@Comment   year={2007},
@Comment   publisher={Springer}
@Comment }

@inproceedings{bellatreche2007sap,
  author    = {Bellatreche, Ladjel and Missaoui, Rokia and Necir, Hamid and Drias, Habiba},
  title     = {Selection and Pruning Algorithms for Bitmap Index Selection Problem Using Data Mining},
  booktitle = {DaWaK 2007 (LNCS 4654)},
  publisher = {Springer},
  year      = {2007},
  pages     = {221--230}
}

@incollection{davis2007idw,
  author    = {Davis, K. C. and Gupta, A.},
  title     = {Indexing in Data Warehouses},
  booktitle = {Data Warehouses and {OLAP}: Concepts, Architectures, and Solutions},
  publisher = {IRM Press},
  year      = {2007}
}

@inproceedings{stockinger2002spa,
  author    = {Stockinger, K. and Wu, K. and Shoshani, A.},
  title     = {Strategies for processing ad hoc queries on large data warehouses},
  booktitle = {DOLAP'02},
  year      = {2002},
  pages     = {72--79}
}

@inproceedings{1183529,
  title     = {Heuristic design of property maps},
  author    = {Ravi Darira and Karen C. Davis and Jennifer {Grommon-Litton}},
  booktitle = {DOLAP'06},
  pages     = {91--98},
  year      = {2006}
}

@inproceedings{1083658,
  title     = {{C-Store}: a column-oriented {DBMS}},
  author    = {Mike Stonebraker and Daniel J. Abadi and Adam Batkin and Xuedong Chen and Mitch Cherniack and Miguel Ferreira and Edmond Lau and Amerson Lin and Sam Madden and Elizabeth O'Neil and Pat O'Neil and Alex Rasin and Nga Tran and Stan Zdonik},
  booktitle = {VLDB '05},
  pages     = {553--564},
  year      = {2005},
  publisher = {VLDB Endowment},
  address   = {San Jose, CA, USA}
}



@unpublished{arxiv:0811.2904,
  author = {Rasmus Pagh and S. Srinivasa Rao},
  title  = {Secondary Indexing in One Dimension: Beyond {B-trees} and Bitmap Indexes},
  note   = {available from
            \url{http://arxiv.org/abs/0811.2904}},
  year   = {2008}
}

@inproceedings{1617427,
  author    = {Zukowski, M. and Heman, S. and Nes, N. and Boncz, P.},
  title     = {Super-Scalar {RAM-CPU} Cache Compression},
  booktitle = {ICDE '06},
  year      = {2006},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}


@inproceedings{Paradies:2010:JCE:1866480.1866510,
  title     = {How to juggle columns: an entropy-based approach for table compression},
  author    = {Paradies, Marcus and Lemke, Christian and Plattner, Hasso and Lehner, Wolfgang and Sattler, Kai-Uwe and Zeier, Alexander and Krueger, Jens},
  booktitle = {IDEAS '10},
  pages     = {205--215},
  year      = {2010}
}


@inproceedings{1247525,
  title     = {How to Barter Bits for Chronons: Compression and Bandwidth Trade Offs for Database Scans},
  author    = {Allison L. Holloway and Vijayshankar Raman and Garret Swart and David J. DeWitt},
  booktitle = {SIGMOD'07},
  pages     = {389--400},
  year      = {2007},
  publisher = {ACM},
  address   = {New York, NY, USA}
}
@inproceedings{1453912,
  title     = {Read-optimized databases, in depth},
  author    = {Allison L. Holloway and David J. DeWitt},
  booktitle = {VLDB'08},
  pages     = {502--513},
  year      = {2008},
  publisher = {VLDB Endowment},
  address   = {San Jose, CA, USA}
}
@inproceedings{1327178,
  author    = {Vicen{\c{c}} Beltran and Jordi Torres and Eduard Ayguad{\'e}},
  title     = {Improving disk bandwidth-bound applications through main memory compression},
  booktitle = {MEDEA'07},
  year      = {2007},
  pages     = {57--63}
}
 
 @article{1453924,
   author  = {Lin Qiao and Vijayshankar Raman and Frederick Reiss and Peter J. Haas and Guy M. Lohman},
   title   = {Main-memory scan sharing for multi-core {CPUs}},
   journal = {Proc. VLDB Endow.},
   volume  = {1},
   number  = {1},
   year    = {2008},
   pages   = {610--621}
 }
@inproceedings{aouiche2007cfp,
  author    = {Aouiche, K. and Lemire, D.},
  title     = {A Comparison of Five Probabilistic View-size Estimation Techniques in {OLAP}},
  booktitle = {DOLAP'07},
  year      = {2007},
  pages     = {17--24},
  publisher = {ACM},
  address   = {New York, NY, USA}
}

@article{1272746,
  title   = {Multi-resolution bitmap indexes for scientific data},
  author  = {Rishi Rakesh Sinha and Marianne Winslett},
  journal = {ACM Trans. Database Syst.},
  year    = {2007},
  volume  = {32},
  number  = {3},
  pages   = {16}
}
@inproceedings{1316694,
  title     = {On the performance of bitmap indices for high cardinality attributes},
  author    = {Kesheng Wu and Ekow Otoo and Arie Shoshani},
  booktitle = {VLDB'04},
  pages     = {24--35},
  year      = {2004}
}


@article{sava:monotone-gray-codes,
  author  = {Carla Savage and Peter Winkler},
  title   = {Monotone {Gray} Codes and the Middle Levels Problem},
  journal = {Journal of Combinatorial Theory, A},
  volume  = {70},
  number  = {2},
  pages   = {230--248},
  year    = {1995}
}



@inbook{knut:vfour-fascicle-two,
  author    = {Donald E. Knuth},
  title     = {The Art of Computer Programming},
  volume    = {4},
  chapter   = {fascicle 2},
  publisher = {Addison Wesley},
  address   = {Reading, MA, USA},
  year      = {2005}
}


@article{godd:long-run-codes,
  author  = {Luis Goddyn and Pavol Gvozdjak},
  title   = {Binary {Gray} Codes with Long Bit Runs},
  journal = {Electronic Journal of Combinatorics},
  volume  = {10},
  number  = {R27},
  pages   = {1--10},
  year    = {2003}
}

@manual{dell:deskstar-user-guide,
  author = {Dell},
  title  = {Specifications: {Hitachi Deskstar P7K500 User's Guide}},
  note   = {\url{https://support.dell.com/support/edocs/storage/P160227/specs.htm} (Last checked 06-09-2010)},
  year   = {2009}
}
@misc{hahn:weatherbench,
  author       = {C. Hahn and S. Warren and J. London},
  title        = {Edited Synoptic Cloud Reports from Ships
                  and Land Stations over the Globe, 1982--1991},
  howpublished = {\url{http://cdiac.ornl.gov/ftp/ndp026b/} (Last checked 06-09-2010)},
  year         = {2004},
  month        = jan
}
                  

@misc{lucene2000,
  author       = {Doug Cutting and others},
  title        = {Lucene: A high-performance, full-featured text search engine library},
  year         = {2000},
  howpublished = {\url{http://lucene.apache.org}~(checked 2009-01-12)}
}

@inproceedings{796300,
  author    = {P. Dagum and R. Karp and M. Luby and S. Ross},
  title     = {An optimal algorithm for {Monte Carlo} estimation},
  booktitle = {FOCS'95},
  year      = {1995}
}
 
 @book{mot1,
   author               = {Motwani, R. and Raghavan, P.},
   title                = {Randomized Algorithms},
   publisher            = {Cambridge University Press},
   address              = {New York, NY, USA},
   year                 = {1995},
   citeulike-article-id = {3503974},
   keywords             = {file-import-08-11-11},
   posted-at            = {2008-11-11 15:43:05},
   priority             = {0}
 }

@article{cohen1998haa,
  author    = {Jonathan D. Cohen},
  title     = {Hardware-assisted algorithm for full-text large-dictionary string matching using n-gram hashing},
  journal   = {Information Processing and Management},
  year      = {1998},
  volume    = {34},
  number    = {4},
  pages     = {443--464},
  publisher = {Elsevier}
}

@article{cohen1999mqr,
  author  = {Jonathan D. Cohen},
  title   = {Massive Query Resolution for Rapid Selective Dissemination of Information},
  journal = {Journal of the American Society for Information Science},
  year    = {1999},
  volume  = {50},
  number  = {3},
  pages   = {195--206}
}

@article{306482,
  title     = {An n-gram hash and skip algorithm for finding large numbers of keywords in continuous text streams},
  author    = {Jonathan D. Cohen},
  journal   = {Softw. Pract. Exper.},
  year      = {1998},
  volume    = {28},
  number    = {15},
  pages     = {1605--1635},
  issn      = {0038-0644},
  publisher = {John Wiley \& Sons, Inc.},
  address   = {New York, NY, USA}
}

@article{Carterette2005613,
  author  = {Ben Carterette and Fazli Can},
  title   = {Comparing inverted files and signature files for searching a large lexicon},
  journal = {Information Processing \& Management},
  volume  = {41},
  number  = {3},
  pages   = {613--633},
  year    = {2005},
  note    = {Cross-Language Information Retrieval},
  issn    = {0306-4573},
  doi     = {10.1016/j.ipm.2003.12.003},
  url     = {http://www.sciencedirect.com/science/article/B6VC8-4BN0DSN-1/2/421bb1bebbb3c9d64d0a84daec25c52d}
}

@article{Mehler200651,
  author   = {Tilman Mehler and Stefan Edelkamp},
  title    = {Dynamic Incremental Hashing in Program Model Checking},
  journal  = {Electronic Notes in Theoretical Computer Science},
  volume   = {149},
  number   = {2},
  pages    = {51--69},
  year     = {2006},
  note     = {Proceedings of the Third Workshop on Model Checking and Artificial Intelligence (MoChArt 2005)},
  issn     = {1571-0661},
  doi      = {10.1016/j.entcs.2005.07.026},
  url      = {http://www.sciencedirect.com/science/article/B75H1-4J5Y9K6-5/2/27e99c37c6faf7bdae096f6b69217c13},
  keywords = {model checking, state space search, hashing}
}

@article{Li20071,
  author  = {Xiaolong Li and Yunxin Zhao},
  title   = {A fast and memory-efficient {N-gram} language model lookup method for large vocabulary continuous speech recognition},
  journal = {Computer Speech \& Language},
  volume  = {21},
  number  = {1},
  pages   = {1--25},
  year    = {2007},
  issn    = {0885-2308},
  doi     = {10.1016/j.csl.2005.11.002},
  url     = {http://www.sciencedirect.com/science/article/B6WCW-4HV72DW-1/2/2948d2c96d1225ac0ada5d528b9143ea}
}

@inproceedings{857699,
  title     = {Using Visualization to Detect Plagiarism in Computer Science Classes},
  author    = {Randy L. Ribler and Marc Abrams},
  booktitle = {INFOVIS'00},
  pages     = {173},
  year      = {2000},
  isbn      = {0-7695-0804-9},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA}
}

@article{shannon1951pae,
  author  = {Shannon, C. E.},
  title   = {Prediction and entropy of printed {English}},
  journal = {Bell System Technical Journal},
  volume  = {30},
  number  = {1},
  pages   = {50--64},
  year    = {1951}
}

  
@misc{tan2006fpm,
  author = {Tan, T. and Gould, S. and Williams, D. and Peltzer, E. and Barrie, R.M.},
  title  = {Fast pattern matching using large compressed databases},
  note   = {{US} Patent App. 11/326,131},
  year   = {2006}
}




@article{arxiv:0901.3751,
  author  = {Daniel Lemire and Owen Kaser and Kamel Aouiche},
  title   = {Sorting Improves Word-aligned Bitmap Indexes},
  journal = {Data \& Knowledge Engineering},
  volume  = {69},
  number  = {1},
  pages   = {3--28},
  year    = {2010},
  details = {Accepted (possibly prior to) 28 August 2009}
}

@inproceedings{1250800,
  author    = {F{\"u}rer, Martin},
  title     = {Faster integer multiplication},
  booktitle = {STOC '07},
  year      = {2007},
  pages     = {57--66}
}
 
 
 @inproceedings{10.1109/ICDE.2007.367892,
   author    = {Daniel J. Abadi and Daniel S. Myers and David J. DeWitt and Samuel R. Madden},
   title     = {Materialization Strategies in a Column-Oriented {DBMS}},
   booktitle = {ICDE'07},
   year      = {2007},
   pages     = {466--475}
 }

@inproceedings{1142548,
  title     = {Integrating compression and execution in column-oriented database systems},
  author    = {Abadi, Daniel and Madden, Samuel and Ferreira, Miguel},
  booktitle = {SIGMOD '06},
  pages     = {671--682},
  year      = {2006},
  publisher = {ACM},
  address   = {New York, NY, USA}
}
 
 @inproceedings{253268,
   title     = {Improved query performance with variant indexes},
   author    = {O'Neil, Patrick and Quass, Dallan},
   booktitle = {SIGMOD '97},
   pages     = {38--49},
   year      = {1997}
 }

 @inproceedings{kaserdolap2008,
   title     = {Histogram-Aware Sorting for Enhanced Word-Aligned Compression in Bitmap Indexes},
   author    = {Owen Kaser and Daniel Lemire and Kamel Aouiche},
   year      = {2008},
   booktitle = {DOLAP '08}
 }
 
 @article{richards1986dca,
   author  = {Richards, Dana},
   title   = {Data compression and {Gray}-code sorting},
   journal = {Information Processing Letters},
   year    = {1986},
   volume  = {22},
   number  = {4},
   pages   = {201--205}
 }

@article{1312181,
  author  = {Anantha, Madhusudhanan and Bose, Bella and AlBdaiwi, Bader},
  title   = {Mixed-Radix {Gray} Codes in {Lee} Metric},
  journal = {IEEE Transactions on Computers},
  volume  = {56},
  number  = {10},
  pages   = {1297--1307},
  year    = {2007},
}
 
 @article{savage1997scg,
  author  = {Savage, Carla},
  title   = {A Survey of Combinatorial {Gray} Codes},
  journal = {SIAM Review},
  volume  = {39},
  pages   = {605--629},
  year    = {1997},
 }


@inproceedings{chapin1998hcb,
  author    = {Chapin, B. and Tate, S.R.},
  title     = {Higher Compression from the {Burrows-Wheeler} Transform by Modified Sorting},
  booktitle = {Data Compression Conference},
  pages     = {532},
  year      = {1998},
}

@article{landau2004apd,
  author    = {Landau, G. M. and Levi, O. and Skiena, Steven and Brook, S. S.},
  title     = {Alphabet Permutation for Differentially Encoding Text},
  journal   = {Lecture Notes in Computer Science},
  pages     = {216--217},
  year      = {2004},
  publisher = {Springer-Verlag},
}

@article{ernvall1984csp,
  author    = {Ernvall, J.},
  title     = {On the construction of spanning paths by {Gray}-code in compression of files},
  journal   = {TSI. Technique et science informatiques},
  volume    = {3},
  number    = {6},
  pages     = {411--414},
  year      = {1984},
  publisher = {Lavoisier},
}


@inproceedings{poosala1997sew,
  author    = {Poosala, V. and Ioannidis, Y. E.},
  title     = {Selectivity Estimation Without the Attribute Value Independence Assumption},
  booktitle = {VLDB'97},
  pages     = {486--495},
  year      = {1997},
}

@article{schwenk2007csl,
  author    = {Schwenk, H.},
  title     = {Continuous space language models},
  journal   = {Computer Speech \& Language},
  volume    = {21},
  number    = {3},
  pages     = {492--518},
  year      = {2007},
  publisher = {Elsevier},
}
     @techreport{burrowswheeler1994,
       author      = {M. Burrows and D. Wheeler},
       title       = {A block sorting lossless data compression algorithm},
       institution = {Digital Equipment Corporation},
       number      = {124},
       year        = {1994},
     }
     
@article{rissanen1979arithmetic,
  author    = {Rissanen, J. and Langdon, G. G.},
  title     = {Arithmetic coding},
  journal   = {IBM Journal of Research and Development},
  volume    = {23},
  number    = {2},
  pages     = {149--162},
  year      = {1979},
  publisher = {IBM Corp.},
  issn      = {0018-8646},
}

@article{li2007fam,
  author    = {Li, X. and Zhao, Y.},
  title     = {A fast and memory-efficient {N}-gram language model lookup method for large vocabulary continuous speech recognition},
  journal   = {Computer Speech \& Language},
  volume    = {21},
  number    = {1},
  pages     = {1--25},
  year      = {2007},
  publisher = {Elsevier},
}


@article{holloway2008rod,
  author    = {Holloway, A. L. and DeWitt, D. J.},
  title     = {Read-optimized databases, in depth},
  journal   = {Proceedings of the VLDB Endowment},
  volume    = {1},
  number    = {1},
  pages     = {502--513},
  year      = {2008},
  publisher = {VLDB Endowment},
}


@comment{duplicates dehne2007compressing.}

@article{dehne2007cdc,
  author    = {Dehne, F. and Eavis, T. and Liang, B.},
  title     = {Compressing Data Cube in Parallel {OLAP} Systems},
  journal   = {Data Science Journal},
  volume    = {6},
  number    = {0},
  pages     = {184--197},
  year      = {2007},
  publisher = {J-STAGE},
}

@article{hamilton2007chi,
  author    = {Hamilton, Chris H. and Rau-Chaplin, Andrew},
  title     = {Compact {Hilbert} Indices: Space-filling Curves for Domains with Unequal Side Lengths},
  journal   = {Information Processing Letters},
  volume    = {105},
  number    = {5},
  pages     = {155--163},
  year      = {2007},
  publisher = {Elsevier},
}


@inproceedings{kamel1994hrt,
  author    = {Kamel, I. and Faloutsos, C.},
  title     = {{Hilbert R-tree}: An improved {R-tree} using fractals},
  booktitle = {VLDB'94},
  pages     = {500--509},
  year      = {1994},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
}
 
 @article{flahive2007bcr,
  author  = {Flahive, M. and Bose, B.},
  title   = {Balancing cyclic {R}-ary {Gray} codes},
  journal = {Electronic Journal of Combinatorics},
  volume  = {14},
  number  = {R31},
  pages   = {1},
  year    = {2007},
 }


@inproceedings{331562,
  author    = {Pinar, Ali and Heath, Michael T.},
  title     = {Improving performance of sparse matrix-vector multiplication},
  booktitle = {Supercomputing '99},
  year      = {1999},
  publisher = {ACM},
  address   = {New York, NY, USA},
  note      = {{Article} {No.} 30},
}

 @misc{Maxima,
  author       = {William Schelter and others},
  title        = {Maxima, a Computer Algebra System},
  howpublished = {\url{http://maxima.sourceforge.net/}},
  year         = {1998},
 }
 
 @inproceedings{scholer2002cii,
  author    = {Scholer, F. and Williams, H.E. and Yiannis, J. and Zobel, J.},
  title     = {Compression of inverted indexes for fast query evaluation},
  booktitle = {SIGIR'02},
  pages     = {222--229},
  year      = {2002},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }
@article{10.1109/TSE.1985.231852,
  author  = {M.A. Bassiouni},
  title   = {Data Compression in Scientific and Statistical Databases},
  journal = {IEEE Transactions on Software Engineering},
  volume  = {11},
  number  = {10},
  pages   = {1047--1058},
  year    = {1985},
}

@inproceedings{1321546,
  author    = {B{\"u}ttcher, Stefan and Clarke, Charles L. A.},
  title     = {Index compression is good, especially for random access},
  booktitle = {CIKM'07},
  pages     = {761--770},
  year      = {2007},
}
 @article{moffat1996sii,
  author  = {Moffat, A. and Zobel, J.},
  title   = {Self-indexing inverted files for fast text retrieval},
  journal = {ACM Transactions on Information Systems},
  volume  = {14},
  number  = {4},
  pages   = {349--379},
  year    = {1996},
 }
@inproceedings{1353407,
  author    = {Eltabakh, Mohamed Y. and Hon, Wing-Kai and Shah, Rahul and Aref, Walid G. and Vitter, Jeffrey S.},
  title     = {The {SBC}-tree: an index for run-length compressed sequences},
  booktitle = {EDBT'08},
  pages     = {523--534},
  year      = {2008},
}
 
 @article{1314854,
  author  = {Vo, Binh Dao and Vo, Kiem-Phong},
  title   = {Compressing table data with column dependency},
  journal = {Theor. Comput. Sci.},
  volume  = {387},
  number  = {3},
  pages   = {273--283},
  year    = {2007},
 }
 
 @inproceedings{672970,
  author    = {Iyer, Balakrishna R. and Wilhite, David},
  title     = {Data Compression Support in Databases},
  booktitle = {VLDB'94},
  pages     = {695--704},
  year      = {1994},
 }
 
 @article{golomb1966rle,
  author  = {Golomb, S. W.},
  title   = {Run-length encodings},
  journal = {IEEE Transactions on Information Theory},
  volume  = {12},
  pages   = {399--401},
  year    = {1966},
 }

@book{barnard08,
  author    = {Samuel Barnard},
  title     = {Higher algebra},
  publisher = {Barnard Press},
  year      = {2008},
}



@misc{prdh:website,
  author       = {{Programme de recherche en d\'emographie historique}},
  title        = {{PRDH} 1881},
  howpublished = {\url{http://www.prdh.umontreal.ca/census/en/main.aspx}},
  year         = {2009},
  note         = {last checked 2010-11-11},
}
  
@misc{prdh:website-differentref,
  author       = {PRDH},
  title        = {The 1881 Canadian census database},
  howpublished = {\url{http://www.prdh.umontreal.ca/census/en/main.aspx}},
  year         = {2009},
  note         = {last checked 2010-11-11},
}


 
 
@article{flahive2008bcr,
  author  = {Flahive, M.},
  title   = {Balancing cyclic {R}-ary {Gray} codes {II}},
  journal = {Electronic Journal of Combinatorics},
  volume  = {15},
  number  = {R128},
  pages   = {1},
  year    = {2008},
}

@inproceedings{raman2008ctq,
  author    = {Raman, V. and Swart, G. and Qiao, L. and Reiss, F. and Dialani, V. and Kossmann, D. and Narang, I. and Sidle, R.},
  title     = {Constant-time query processing},
  booktitle = {ICDE '08},
  pages     = {60--69},
  year      = {2008},
}
@article{1132964,
  author  = {Graefe, Goetz},
  title   = {Implementing sorting in database systems},
  journal = {ACM Comput. Surv.},
  volume  = {38},
  number  = {3},
  pages   = {10},
  year    = {2006},
}
 
 @inproceedings{1516430,
  author    = {Canahuate, Guadalupe and Apaydin, Tan and Sacan, Ahmet and Ferhatosmanoglu, Hakan},
  title     = {Secondary bitmap indexes with vertical and horizontal partitioning},
  booktitle = {EDBT '09},
  pages     = {600--611},
  year      = {2009},
 }

@inproceedings{apay:data-reordering,
  author    = {Tan Apaydin and Ali {\c{S}}aman Tosun and Hakan Ferhatosmanoglu},
  title     = {Analysis of Basic Data Reordering Techniques},
  booktitle = {SSDBM 2008, LNCS 5096},
  pages     = {517--524},
  year      = {2008},
}

@article{alber2000mch,
  author  = {Alber, J. and Niedermeier, R.},
  title   = {On multidimensional curves with {Hilbert} property},
  journal = {Theory of Computing Systems},
  volume  = {33},
  number  = {4},
  pages   = {295--312},
  year    = {2000},
}
@inproceedings{1431053,
  author    = {Haverkort, Herman and van Walderveen, Freek},
  title     = {Locality and Bounding-Box Quality of Two-Dimensional Space-Filling Curves},
  booktitle = {ESA '08},
  pages     = {515--527},
  year      = {2008},
}
 @article{niedermeier2002tol,
  author  = {Niedermeier, R. and Reinhardt, K. and Sanders, P.},
  title   = {Towards optimal locality in mesh-indexings},
  journal = {Discrete Applied Mathematics},
  volume  = {117},
  number  = {1--3},
  pages   = {211--237},
  year    = {2002},
 }

@inproceedings{HaverkortW09,
  author    = {Herman J. Haverkort and Freek van Walderveen},
  title     = {Four-Dimensional {Hilbert} Curves for {R}-Trees},
  booktitle = {ALENEX '09},
  pages     = {63--73},
  year      = {2009},
}

@article{aouiche2009,
  author  = {Aouiche, Kamel and Lemire, Daniel and Godin, Robert},
  title   = {Web 2.0 {OLAP}: From Data Cubes to Tag Clouds},
  journal = {Lecture Notes in Business Information Processing},
  volume  = {18},
  pages   = {51--64},
  year    = {2009},
}

@unpublished{rowreordering,
  author = {Daniel Lemire and Owen Kaser and Eduardo Gutarra},
  title  = {Reordering Rows for Smaller Indexes: Beyond the Lexicographic Order},
  note   = {in preparation},
  year   = {2010},
}

@unpublished{rlewithsorting,
  author = {Daniel Lemire and Owen Kaser},
  title  = {Reordering Columns for Smaller Indexes},
  note   = {in preparation, available from \url{http://arxiv.org/abs/0909.1346}},
  year   = {2009},
}


@inproceedings{cardenal2002fast,
  author    = {Cardenal-L{\'o}pez, A. and Di{\'e}guez-Tirado, F. J. and Garc{\'\i}a-Mateo, C.},
  title     = {Fast {LM} look-ahead for large vocabulary continuous speech recognition using perfect hashing},
  booktitle = {ICASSP'02},
  pages     = {705--708},
  year      = {2002},
}

@inproceedings{zhang2002minimum,
  author       = {Zhang, X. and Zhao, Y.},
  title        = {Minimum perfect hashing for fast {N-gram} language model lookup},
  booktitle    = {Seventh International Conference on Spoken Language Processing},
  pages        = {401--404},
  year         = {2002},
  organization = {ISCA},
}

@inproceedings{talbot2008randomized,
  author    = {Talbot, D. and Brants, T.},
  title     = {Randomized language models via perfect hash functions},
  booktitle = {ACL'08},
  pages     = {505--513},
  year      = {2008},
}
@inproceedings{talbot2007smoothed,
  author    = {Talbot, D. and Osborne, M.},
  title     = {Smoothed {Bloom} filter language models: Tera-scale {LMs} on the cheap},
  booktitle = {EMNLP'07},
  pages     = {468--476},
  year      = {2007},
}
@inproceedings{talbot2007randomised,
  author    = {Talbot, D. and Osborne, M.},
  title     = {Randomised language modelling for statistical machine translation},
  booktitle = {ACL'07},
  pages     = {512--519},
  year      = {2007},
}

@article{kornblum2006identifying,
  author    = {Kornblum, J.},
  title     = {Identifying almost identical files using context triggered piecewise hashing},
  journal   = {Digital Investigation},
  volume    = {3},
  pages     = {91--97},
  year      = {2006},
  publisher = {Elsevier},
}

@inproceedings{718147,
  author    = {Turner, M. J. and Hammond, R. and Cotton, P.},
  title     = {A {DBMS} For Large Statistical Databases},
  booktitle = {VLDB'79},
  pages     = {319--327},
  year      = {1979},
  publisher = {VLDB Endowment},
  address   = {San Jose, CA, USA},
}
@article{peano1890courbe,
  author    = {Peano, G.},
  title     = {Sur une courbe, qui remplit toute une aire plane},
  journal   = {Mathematische Annalen},
  volume    = {36},
  number    = {1},
  pages     = {157--160},
  year      = {1890},
  publisher = {Springer},
}
@article{16877,
  author  = {Faloutsos, Christos},
  title   = {Multiattribute hashing using {Gray} codes},
  journal = {SIGMOD Record},
  volume  = {15},
  number  = {2},
  pages   = {227--238},
  year    = {1986},
}
 @article{moon2001analysis,
  author  = {Moon, B. and Jagadish, H. V. and Faloutsos, C. and Saltz, J. H.},
  title   = {Analysis of the clustering properties of the {Hilbert} space-filling curve},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {13},
  number  = {1},
  pages   = {124--141},
  year    = {2001},
 }
@inproceedings{1458181,
  author    = {Valle, Eduardo and Cord, Matthieu and Philipp-Foliguet, Sylvie},
  title     = {High-dimensional descriptor indexing for large multimedia databases},
  booktitle = {CIKM '08},
  pages     = {739--748},
  year      = {2008},
}
 @book{lebesgue1904lecons,
  author    = {Lebesgue, H. L.},
  title     = {Le{\c{c}}ons sur l'int{\'e}gration et la recherche des fonctions primitives: profess{\'e}es au {Coll{\`e}ge} de {France}},
  publisher = {Gauthier-Villars},
  year      = {1904},
 }

@incollection{eavis2007,
  author    = {Eavis, Todd and Cueva, David},
  title     = {A {Hilbert} Space Compression Architecture for Data Warehouse Environments},
  booktitle = {Data Warehousing and Knowledge Discovery},
  series    = {Lecture Notes in Computer Science},
  volume    = {4654},
  pages     = {1--12},
  publisher = {Springer},
  year      = {2007},
}
 @article{eavis2007hilbert,
  author    = {Eavis, T. and Cueva, D.},
  title     = {A {Hilbert} Space compression architecture for data warehouse environments},
  journal   = {Lecture Notes in Computer Science},
  volume    = {4654},
  pages     = {1--12},
  year      = {2007},
  publisher = {Springer},
 }

@article{dehne2007compressing,
  author    = {Dehne, F. and Eavis, T. and Liang, B.},
  title     = {Compressing Data Cube in Parallel {OLAP} Systems},
  journal   = {Data Science Journal},
  volume    = {6},
  number    = {0},
  pages     = {184--197},
  year      = {2007},
  publisher = {J-STAGE},
}


@article{lemire-OLA,
  author  = {Daniel Lemire and Owen Kaser},
  title   = {Hierarchical Bin Buffering: Online Local Moments for Dynamic External Memory Arrays},
  journal = {{ACM} Transactions on Algorithms},
  volume  = {4},
  number  = {1},
  pages   = {31~pages},
  year    = {2008},
  note    = {article 14},
}


@article{ailamaki2002data,
  author    = {Ailamaki, A. and DeWitt, D.J. and Hill, M.D.},
  title     = {Data page layouts for relational databases on deep memory hierarchies},
  journal   = {The VLDB Journal},
  volume    = {11},
  number    = {3},
  pages     = {198--215},
  year      = {2002},
  publisher = {Springer},
}
  @inproceedings{318923,
    author    = {Copeland, George P. and Khoshafian, Setrag N.},
    title     = {A decomposition storage model},
    booktitle = {SIGMOD'85},
    pages     = {268--279},
    year      = {1985},
    publisher = {ACM},
    address   = {New York, NY, USA},
  }

 @inproceedings{1559879,
  author    = {Ivanova, Milena G. and Kersten, Martin L. and Nes, Niels J. and Gon{\c{c}}alves, Romulo A. P.},
  title     = {An architecture for recycling intermediates in a column-store},
  booktitle = {SIGMOD'09},
  pages     = {309--320},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }
 @inproceedings{1559877,
  author    = {Binnig, Carsten and Hildenbrand, Stefan and F{\"a}rber, Franz},
  title     = {Dictionary-based order-preserving string compression for main memory column stores},
  booktitle = {SIGMOD'09},
  pages     = {283--296},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }
 
 @inproceedings{1376712,
  author    = {Abadi, Daniel J. and Madden, Samuel R. and Hachem, Nabil},
  title     = {Column-stores vs. row-stores: how different are they really?},
  booktitle = {SIGMOD'08},
  pages     = {967--980},
  year      = {2008},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }
 
 @inproceedings{1559878,
  author    = {Idreos, Stratos and Kersten, Martin L. and Manegold, Stefan},
  title     = {Self-organizing tuple reconstruction in column-stores},
  booktitle = {SIGMOD'09},
  pages     = {297--308},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }
 
 @inproceedings{1007570,
  author    = {Gray, Jim},
  title     = {The next database revolution},
  booktitle = {SIGMOD'04},
  pages     = {1--4},
  year      = {2004},
  publisher = {ACM},
  address   = {New York, NY, USA},
 }

@inproceedings{kuma:monk-architecture,
  author    = {Amit Kumar},
  title     = {{MONK} Project: Architecture Overview},
  booktitle = {JCDL'09},
  year      = {2009},
  publisher = {ACM},
}

@techreport{meandre-tr,
  author      = {Llor{\`a}, Xavier and {\'A}cs, Berie and Auvil, Loretta S. and
                 Capitanu, Boris and Welge, Michael E. and Goldberg, David E.},
  title       = {Meandre: Semantic-Driven Data-Intensive Flows in the Clouds},
  institution = {Dept. of Industrial and Enterprise Systems Engineering},
  number      = {2008-013},
  month       = oct,
  year        = {2008},
}

@inproceedings{meandre,
  author    = {Llor{\`a}, Xavier and {\'A}cs, Berie and Auvil, Loretta S. and
               Capitanu, Boris and Welge, Michael E. and Goldberg, David E.},
  title     = {Meandre: Semantic-Driven Data-Intensive Flows in the Clouds},
  booktitle = {IEEE e-Science 2008},
  pages     = {238--245},
  month     = dec,
  year      = {2008},
}

@article{muel:literary-informatics,
  author  = {Martin Mueller},
  title   = {Digital {Shakespeare}, or towards a literary informatics},
  journal = {Shakespeare},
  volume  = {4},
  number  = {3},
  pages   = {284--301},
  year    = {2008},
}




@inproceedings{sank:digitizing-million,
  author    = {K. Pramod Sankar and Vamshi Ambati and Lakshmi Pratha and C. V. Jawahar},
  title     = {Digitizing a Million Books: Challenges for Document Analysis},
  booktitle = {DAS 2006 (LNCS 3872)},
  pages     = {425--436},
  year      = {2006},
  publisher = {Springer-Verlag},
}



@inproceedings{vuil:near-martha,
  author    = {Romain Vuillemot and Tanya Clement and Catherine Plaisant and Amit Kumar},
  title     = {What's Being Said Near ``{Martha}''? {Exploring} Name Entities
               in Literary Text Collections},
  booktitle = {IEEE Symposium on Visual Analytics and Technology '09},
  year      = {2009},
  publisher = {IEEE},
  note      = {also U. Maryland CS TR2009-12},
}



@book{more:trees-book,
  author    = {Franco Moretti},
  title     = {Graphs, Maps, Trees: Abstract models for literary history},
  publisher = {Verso},
  address   = {New York},
  year      = {2005},
}

@misc{mona:ebay-dw,
  author       = {Curt Monash},
  title        = {{eBay's} two enormous data warehouses},
  howpublished = {\url{http://www.dbms2.com/2009/04/30/ebays-two-enormous-data-warehouses/}},
  month        = apr,
  year         = {2009},
}


@misc{mona:yahoo-dw,
  author       = {Curt Monash},
  title        = {Yahoo is up to 10 Petabytes now?},
  howpublished = {\url{http://www.dbms2.com/2009/07/06/yahoo-is-up-to-10-petabytes-now/}},
  month        = jul,
  year         = {2009},
}

@misc{kell:scan-this-book,
  author       = {Kevin Kelly},
  title        = {Scan This Book!},
  howpublished = {New York Times Magazine (14 May 2006)},
  year         = {2006},
}

@article{shil:dank-cellar,
  author  = {Peter Shillingsburg},
  title   = {The dank cellar of electronic text},
  journal = llc,
  volume  = {24},
  number  = {1},
  pages   = {19--25},
  year    = {2009},
}


@inproceedings{abou:hadoopDB,
  author          = {Azza Abouzeid and Kamil {Bajda-Pawlikowski} and Daniel Abadi and Avi Silberschatz and Alexander Rasin},
  title           = {{HadoopDB}: An Architectural Hybrid of {MapReduce} and {DBMS} Technologies for Analytical Workloads},
  booktitle       = {VLDB'09},
  month           = aug,
  year            = {2009},
  publisher       = {ACM},
  IGNorganization = {VLDB Endowment},
}

@article{peng:quantitative,
  author  = {Roger D. Peng and Nicolas W. Hengartner},
  title   = {Quantitative Analysis of Literary Styles},
  journal = {The American Statistician},
  volume  = {56},
  number  = {3},
  year    = {2002},
}



@article{will:sentence-length,
  author  = {C. B. Williams},
  title   = {A Note on the Statistical Analysis of Sentence-Length as a Criterion of Literary Style},
  journal = {Biometrika},
  volume  = {31},
  pages   = {356--361},
  year    = {1940},
  annote  = {need to verify},
}

@inproceedings{DBLP:conf/vldb/GuptaS06,
  author    = {Rahul Gupta and Sunita Sarawagi},
  title     = {Creating Probabilistic Databases from Information Extraction Models},
  booktitle = {VLDB'06},
  pages     = {965--976},
  year      = {2006},
  ee        = {http://www.vldb.org/conf/2006/p965-gupta.pdf},
  jcrossref = {DBLP:conf/vldb/2006},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}


@inproceedings{1325861,
  author    = {R{\'e}, Christopher and Suciu, Dan},
  title     = {Materialized views in probabilistic databases: for information exchange and query optimization},
  booktitle = {VLDB '07},
  pages     = {51--62},
  year      = {2007},
  publisher = {VLDB Endowment},
  location  = {Vienna, Austria},
  isbn      = {978-1-59593-649-3},
}

@inproceedings{DBLP:conf/soda/JayramKV07,
  author         = {T. S. Jayram and Satyen Kale and Erik Vee},
  title          = {Efficient aggregation algorithms for probabilistic data},
  booktitle      = {SODA'07},
  pages          = {346--355},
  year           = {2007},
  ee             = {http://doi.acm.org/10.1145/1283383.1283420},
  unusedcrossref = {DBLP:conf/soda/2007},
  bibsource      = {DBLP, http://dblp.uni-trier.de},
}



@article{1538810,
  author    = {Dalvi, Nilesh and R{\'e}, Christopher and Suciu, Dan},
  title     = {Probabilistic databases: diamonds in the dirt},
  journal   = {Commun. ACM},
  volume    = {52},
  number    = {7},
  pages     = {86--94},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
  issn      = {0001-0782},
  doi       = {10.1145/1538788.1538810},
}

@misc{ramsan6200,
  author       = {{Texas Memory Systems}},
  title        = {{Products-RamSan-6200}},
  howpublished = {\url{http://www.ramsan.com/products/ramsan-6200.htm}},
  year         = {2009},
  note         = {last checked 2009-09-19},
  price        = {4.4M USD; 140kUSD for 2TB unit; 18kUSD for intermal 500G unit},
}


@misc{micr:ddr-doc-2004,
  author       = {{Micron Technology}},
  title        = {{DDR2} and Fully Buffered {DIMMs}: Status and Trends},
  howpublished = {\url{http://www.memforum.org/upload/Micron.pdf}},
  month        = sep,
  year         = {2004},
  annote       = {last checked 2009-09-19},
}

@misc{internet-archive-texts,
  author       = {{Internet Archive}},
  title        = {Text Archive},
  howpublished = {\url{http://www.archive.org/details/texts}},
  note         = {last checked 2009-09-19},
}

@article{1516062,
  author    = {Agrawal, Rakesh and Ailamaki, Anastasia and Bernstein, Philip A. and Brewer, Eric A. and Carey, Michael J. and Chaudhuri, Surajit and Doan, Anhai and Florescu, Daniela and Franklin, Michael J. and Garcia-Molina, Hector and Gehrke, Johannes and Gruenwald, Le and Haas, Laura M. and Halevy, Alon Y. and Hellerstein, Joseph M. and Ioannidis, Yannis E. and Korth, Hank F. and Kossmann, Donald and Madden, Samuel and Magoulas, Roger and Ooi, Beng Chin and O'Reilly, Tim and Ramakrishnan, Raghu and Sarawagi, Sunita and Stonebraker, Michael and Szalay, Alexander S. and Weikum, Gerhard},
  title     = {The {Claremont} report on database research},
  journal   = cacm,
  volume    = {52},
  number    = {6},
  pages     = {56--65},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
  issn      = {0001-0782},
  doi       = {10.1145/1516046.1516062},
}

@article{1373451,
  author    = {Juola, Patrick},
  title     = {Authorship attribution},
  journal   = {Found. Trends Inf. Retr.},
  volume    = {1},
  number    = {3},
  pages     = {233--334},
  year      = {2006},
  publisher = {Now Publishers Inc.},
  address   = {Hanover, MA, USA},
  issn      = {1554-0669},
  doi       = {10.1561/1500000005},
}


@article{sich:better-than-zipf,
  author  = {H. S. Sichel},
  title   = {On a Distribution Law for Word Frequencies},
  journal = {Journal of the American Statistical Association},
  volume  = {70},
  pages   = {542--547},
  year    = {1975},
  annote  = {said to be better than Zipf in ACL/ALLC'97 panel forum},
}



@incollection{meun:carat-classification,
  author    = {Jean Guy Meunier and Dominic Forest and Ismail Biskri},
  title     = {Classification and Categorization in Computer Assisted
               Reading and Analysis of Texts},
  booktitle = {Handbook of Categorization in Cognitive Science},
  editor    = {Henri Cohen and Claire Lefebvre},
  publisher = {Elsevier},
  year      = {2005},
}

@inproceedings{kirs:remaking-reading,
  author    = {Matthew G. Kirschenbaum},
  title     = {The Remaking of Reading: Data Mining and the Digital Humanities},
  booktitle = {{NSF} Sympos. Next Gen. Data Mining and Cyber-Enabled Disc. for Innov.'07},
  year      = {2007},
  note      = {online: \url{http://www.cs.umbc.edu/~hillol/NGDM07/abstracts/talks/MKirschenbaum.pdf} checked 2009-09-19},
}


@inproceedings{don:text-mining-and-visualization,
  author    = {Anthony Don and Elena Zheleva and Machon Gregory and Sureyya Tarkan and
               Loretta Auvil and Tanya Clement and Ben Shneiderman and Catherine Plaisant},
  title     = {Discovering Interesting Usage Patterns in Text Collections:
               Integrating Text Mining with Visualization},
  booktitle = {CIKM'07},
  pages     = {213--222},
  year      = {2007},
  publisher = {ACM},
}



@article{pere:integratingDW,
  author  = {Juan Manuel P{\'e}rez and Rafael Berlanga and Mar{\'\i}a Jos{\'e} Aramburu and Torben Bach Pedersen},
  title   = {Integrating Data Warehousing with {Web} Data: A Survey},
  journal = {{IEEE} Trans. Knowl. Data Eng.},
  volume  = {20},
  number  = {7},
  pages   = {940--955},
  year    = {2008},
}

@inproceedings{1610557,
  author    = {Leung, Carson Kai-Sang and Brajczuk, Dale A.},
  title     = {Efficient algorithms for mining constrained frequent patterns from uncertain data},
  booktitle = {U '09: Proceedings of the 1st ACM SIGKDD Workshop on Knowledge Discovery from Uncertain Data},
  pages     = {9--18},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
  location  = {Paris, France},
  isbn      = {978-1-60558-675-5},
  doi       = {10.1145/1610555.1610557},
}




@inproceedings{fuji:topiography,
  author    = {Ko Fujimura and Shigeru Fujimura and Tatsushi Matsubayashi and Takeshi Yamada and Hidenori Okuda},
  title     = {Topiography: Visualization for Large-scale Tag Clouds},
  booktitle = {WWW'08},
  pages     = {1087--1088},
  year      = {2008},
}


@inproceedings{inok:OLAP-text-cikm07,
  author       = {Akihiro Inokuchi and Koichi Takeda},
  title        = {A Method of Online Analytical Processing of Text Data},
  booktitle    = {CIKM'07},
  year         = {2007},
  organization = {ACM},
}


@inproceedings{rava:top-keyword,
  author    = {Franck Ravat and Olivier Teste and Ronan Tournier and Gilles Zurfluh},
  title     = {{Top\_Keyword}: An Aggregation Function for Textual Document {OLAP}},
  booktitle = {DaWaK'08},
  pages     = {55--64},
  year      = {2008},
  publisher = {Springer-Verlag},
  note      = {LNCS 5182},
}




@article{juol:prototype,
  author  = {Patrick Juola and John Sofko and Patrick Brennan},
  title   = {A Prototype for Authorship Attribution Studies},
  journal = llc,
  volume  = {21},
  number  = {2},
  pages   = {169--178},
  year    = {2006},
}


@article{stol:polaris-cacm,
  author  = {Chris Stolte and Diane Ting and Pat Hanrahan},
  title   = {Polaris: A System for Query, Analysis, and Visualization of Multidimensional Databases},
  journal = cacm,
  volume  = {51},
  number  = {11},
  pages   = {75--84},
  month   = nov,
  year    = {2008},
}

@inproceedings{terrier,
  author    = {Iadh Ounis and others},
  title     = {Terrier: A High Performance and Scalable Information Retrieval Platform},
  booktitle = {SIGIR'06 Workshop on Open Source Inf. Retr.},
  year      = {2006},
}


@inproceedings{lai:querying-treebanks,
  author    = {Catherine Lai and Steven Bird},
  title     = {Querying and Updating Treebanks: A Critical Survey and Requirements Analysis},
  booktitle = {Australasian Lang. Tech. Workshop},
  year      = {2004},
}

@inproceedings{DBLP:conf/icde/WiwatwattanaJLS07,
  author    = {Nuwee Wiwatwattana and H. V. Jagadish and
               Laks V. S. Lakshmanan and Divesh Srivastava},
  title     = {{X$^{\mbox{3}}$}: A Cube Operator for {XML OLAP}},
  booktitle = {ICDE},
  pages     = {916--925},
  year      = {2007},
  ee        = {http://dx.doi.org/10.1109/ICDE.2007.367937},
  dcrossref = {DBLP:conf/icde/2007},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}


@article{stav:text-mining-survey,
  author  = {Anna Stavrianou and Periklis Andritsos and Nicolas Nicoloyannis},
  title   = {Overview and Semantic Issues of Text Mining},
  journal = {{SIGMOD} Record},
  volume  = {36},
  number  = {3},
  pages   = {23--34},
  year    = {2007},
}

@inproceedings{DBLP:conf/ssdbm/JensenMP01,
  author    = {Mikael R. Jensen and Thomas H. M{\o}ller and Torben Bach Pedersen},
  title     = {Specifying {OLAP} Cubes On {XML} Data},
  booktitle = {SSDBM},
  pages     = {101--112},
  year      = {2001},
  xcrossref = {DBLP:conf/ssdbm/2001},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}


@inproceedings{10.1109/SSDM.1997.621175,
  author    = {Hans-J. Lenz and Arie Shoshani},
  title     = {Summarizability in {OLAP} and Statistical Data Bases},
  booktitle = {International Conference on Scientific and Statistical Database Management},
  pages     = {132},
  year      = {1997},
  publisher = {IEEE Computer Society},
  address   = {Los Alamitos, CA, USA},
  isbn      = {0-8186-7952-2},
  doi       = {10.1109/SSDM.1997.621175},
}



@article{alba:funny-billion,
  author  = {Alfredo Alba and Varun Bhagwan and Mike Ching and Alex Cozzi and
             Raj Desai and Daniel Gruhl and Kevin Haas and Linda Kato and
             Jeff Kusnitz and Bryan Langston and Ferdy Nagy and Linda Nguyen and
             Jan Pieper and Savitha Srinivastan and Anthony Stuart and Renjie Tang},
  title   = {A Funny Thing Happened on the Way to a Billion \ldots},
  journal = {Bulletin of the Technical Committee on Data Engineering},
  volume  = {31},
  number  = {4},
  pages   = {27--36},
  year    = {2006},
}

@misc{gate-url,
  author       = {{NLP Group, U. Sheffield}},
  title        = {{GATE, A General Architecture for Text Engineering}},
  howpublished = {\url{http://gate.ac.uk/}},
}
  

@misc{whatlanguage-url,
  author       = {{Peter Cooper}},
  title        = {{WhatLanguage: Ruby Library To Detect The Language Of A Text}},
  howpublished = {\url{http://www.rubyinside.com/whatlanguage-ruby-language-detection-library-1085.html}},
}
  

@article{pasa:mining-metaphors,
  author  = {Brad Pasanek and D. Sculley},
  title   = {Mining Millions of Metaphors},
  journal = llc,
  volume  = {23},
  number  = {3},
  year    = {2008},
}



@misc{pasa:metaphor-searcher,
  author       = {Brad Pasanek},
  title        = {The Mind is a Metaphor},
  howpublished = {\url{http://mind.textdriven.com/db/browse.php?}},
  note         = {last checked 2009-09-26},
}

Martin Ph. (2003). Correction and Extension of WordNet 1.7.
ICCS 2003, 11th International Conference on Conceptual Structures,
(© Springer Verlag, LNAI 2746, pp. 160-173), Dresden, Germany, July 21-25, 2003. 

@inproceedings{mart:integration-wordnet17,
  author    = {Philippe Martin},
  title     = {Correction and Extension of {WordNet} 1.7},
  booktitle = {ICCS'03 (LNAI 2746)},
  pages     = {160--173},
  year      = {2003},
}




@inproceedings{qi:imperfect-integration-sigmod,
  author       = {Yan Qi and K. Sel{\c{c}}uk Candan and Junichi Tatemura and Songting Chen and Fenglin Liao},
  title        = {Supporting {OLAP} Operations over Imperfectly Integrated Taxonomies},
  booktitle    = {SIGMOD'08},
  pages        = {875--888},
  year         = {2008},
  organization = {ACM},
}


@inproceedings{dbpubs,
  author    = {Baid, Akanksha and Balmin, Andrey and Hwang, Heasoo and Nijkamp, Erik and Rao, Jun and Reinwald, Berthold and Simitsis, Alkis and Sismanis, Yannis and van Ham, Frank},
  title     = {{DBPubs:} multidimensional exploration of database publications},
  booktitle = {PVLDB'08},
  pages     = {1456--1459},
  year      = {2008},
  publisher = {VLDB Endowment},
  doi       = {10.1145/1454159.1454199},
}



@article{wind:monarchia-stemmatic,
  author  = {Windram, Heather F. and Shaw, Prue and Robinson, Peter and Howe, Christopher J.},
  title   = {Dante's \textit{Monarchia} as a Test Case for the Use of Phylogenetic Methods in Stemmatic Analysis},
  journal = llc,
  volume  = {23},
  number  = {4},
  year    = {2008},
}



@article{jock:mormon-attribution,
  author  = {Jockers, Matthew L. and Witten, Daniela M. and Criddle, Craig S.},
  title   = {Reassessing Authorship of the \textit{Book of Mormon} using delta and nearest shrunken centroid classification},
  journal = llc,
  volume  = {23},
  number  = {4},
  year    = {2008},
}

@article{952932,
  author    = {Park, Chang-Sup and Kim, Myoung Ho and Lee, Yoon-Joon},
  title     = {Usability-based caching of query results in {OLAP} systems},
  journal   = {J. Syst. Softw.},
  volume    = {68},
  number    = {2},
  pages     = {103--119},
  year      = {2003},
  publisher = {Elsevier Science Inc.},
  address   = {New York, NY, USA},
  issn      = {0164-1212},
  doi       = {10.1016/S0164-1212(02)00142-5},
}

@article{sun:incremental-tensor,
  author  = {Sun, Jimeng and Tao, Dacheng and Papadimitriou, Spiros and Yu, Philip S. and Faloutsos, Christos},
  title   = {Incremental Tensor Analysis: Theory and Applications},
  journal = {ACM Transactions on Knowledge Discovery from Data},
  volume  = {2},
  number  = {3},
  year    = {2008},
}

@inproceedings{1287437,
  author    = {Lee, Young-Koo and Whang, Kyu-Young and Moon, Yang-Sae and Song, Il-Yeol},
  title     = {A one-pass aggregation algorithm with the optimal buffer size in multidimensional {OLAP}},
  booktitle = {VLDB '02},
  pages     = {790--801},
  year      = {2002},
  publisher = {VLDB Endowment},
  location  = {Hong Kong, China},
}

@article{781550,
  author    = {Lee, Young-Koo and Whang, Kyu-Young and Moon, Yang-Sae and Song, Il-Yeol},
  title     = {An aggregation algorithm using a multidimensional file in multidimensional {OLAP}},
  journal   = {Inf. Sci.},
  volume    = {152},
  number    = {1},
  pages     = {121--138},
  year      = {2003},
  publisher = {Elsevier Science Inc.},
  address   = {New York, NY, USA},
  issn      = {0020-0255},
  doi       = {10.1016/S0020-0255(03)00077-X},
}


@misc{tapo:recipes,
  author       = {{TAPoR Project}},
  title        = {{TAPoR} Portal Recipes},
  howpublished = {online: \url{http://tada.mcmaster.ca/Main/TaporRecipes}},
  year         = {2009},
  note         = {checked 2010-08-30},
}

@misc{monk:javadoc,
  author       = {{MONK Project}},
  title        = {{MONK} Javadoc},
  howpublished = {online: \url{http://monkproject.org/docs/monk-datastore-doc/}},
  note         = {last checked 2010-08-30},
}

@article{1538805,
  author    = {Graefe, Goetz},
  title     = {The five-minute rule 20 years later (and how flash memory changes the rules)},
  journal   = cacm,
  volume    = {52},
  number    = {7},
  pages     = {48--59},
  year      = {2009},
  publisher = {ACM},
  address   = {New York, NY, USA},
  issn      = {0001-0782},
  doi       = {10.1145/1538788.1538805},
}

@inproceedings{ailamaki2001weaving,
  author    = {Ailamaki, A. and DeWitt, D. J. and Hill, M. D. and Skounakis, M.},
  title     = {Weaving relations for cache performance},
  booktitle = {VLDB'01},
  pages     = {169--180},
  year      = {2001},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
}
@article{zaker2008,
  author  = {Zaker, M. and Phon-Amnuaisuk, S. and Haw, S. C.},
  title   = {An Adequate Design for Large Data Warehouse Systems: Bitmap Index Versus {B-Tree} Index},
  journal = {International Journal of Computers and Communications},
  volume  = {2},
  number  = {2},
  pages   = {39--46},
  year    = {2008},
}

@inproceedings{DBLP:conf/dolap/MissaouiGCB07,
  author    = {Rokia Missaoui and Cyril Goutte and Anicet Kouomou Choupo and Ameur Boujenoui},
  title     = {A Probabilistic Model for Data Cube Compression and Query Approximation},
  booktitle = {DOLAP},
  pages     = {33--40},
  year      = {2007},
}

@inproceedings{brunoelephant,
  author    = {Bruno, Nicolas},
  title     = {Teaching an Old Elephant New Tricks},
  booktitle = {CIDR '09},
  year      = {2009},
}
 
 
@inproceedings{malik2007optimizing,
  author    = {Malik, H. H. and Kender, J. R.},
  title     = {Optimizing Frequency Queries for Data Mining Applications},
  booktitle = {ICDM'07},
  pages     = {595--600},
  year      = {2007},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
}

@article{rosenkrantz1977analysis,
  author    = {Rosenkrantz, D. J. and Stearns, R. E. and {Lewis II}, P. M.},
  title     = {An analysis of several heuristics for the traveling salesman problem},
  journal   = {SIAM J. Comput.},
  volume    = {6},
  number    = {3},
  pages     = {563--581},
  year      = {1977},
  publisher = {SIAM},
}
@article{hahsler2007tsp,
  author    = {Hahsler, M. and Hornik, K.},
  title     = {{TSP}--Infrastructure for the traveling salesperson problem},
  journal   = {Journal of Statistical Software},
  volume    = {23},
  number    = {2},
  pages     = {1--21},
  year      = {2007},
  publisher = {Citeseer},
}

@article{kahng2004match,
  author    = {Kahng, A. B. and Reda, S.},
  title     = {Match twice and stitch: a new {TSP} tour construction heuristic},
  journal   = {Operations Research Letters},
  volume    = {32},
  number    = {6},
  pages     = {499--509},
  year      = {2004},
  publisher = {Elsevier},
}
@article{clarke1964scheduling,
  author    = {Clarke, G. and Wright, J. W.},
  title     = {Scheduling of vehicles from a central depot to a number of delivery points},
  journal   = {Operations Research},
  volume    = {12},
  number    = {4},
  pages     = {568--581},
  year      = {1964},
  publisher = {Operations Research Society of America},
}

@article{Bertsimas1989241,
  author  = {Bertsimas, Dimitris and Grigni, Michelangelo},
  title   = {Worst-case examples for the spacefilling curve heuristic for the {Euclidean} traveling salesman problem},
  journal = {Operations Research Letters},
  volume  = {8},
  number  = {5},
  pages   = {241--244},
  year    = {1989},
}


@article{platzman1989spacefilling,
  author  = {Platzman, L. K. and {Bartholdi III}, J. J.},
  title   = {Spacefilling curves and the planar travelling salesman problem},
  journal = {Journal of the ACM},
  volume  = {36},
  number  = {4},
  pages   = {719--737},
  year    = {1989},
}

@incollection{johnson2004,
  author    = {Johnson, David S. and McGeoch, Lyle A.},
  title     = {Experimental analysis of heuristics for the {STSP}},
  booktitle = {The Traveling Salesman Problem and Its Variations},
  editor    = {Gutin, Gregory and Punnen, Abraham P.},
  pages     = {369--443},
  publisher = {Springer},
  year      = {2004},
}




@article{cesari1996divide,
  author    = {Cesari, G.},
  title     = {Divide and conquer strategies for parallel {TSP} heuristics},
  journal   = {Computers and Operations Research},
  volume    = {23},
  number    = {7},
  pages     = {681--694},
  year      = {1996},
  publisher = {Elsevier},
}



@article{helsgaun2000effective,
  author    = {Helsgaun, K.},
  title     = {An effective implementation of the {Lin--Kernighan} traveling salesman heuristic},
  journal   = {European Journal of Operational Research},
  volume    = {126},
  number    = {1},
  pages     = {106--130},
  year      = {2000},
  publisher = {Elsevier},
}

@article{applegate2003chained,
  author  = {Applegate, D. and Cook, W. and Rohe, A.},
  title   = {Chained {Lin-Kernighan} for large traveling salesman problems},
  journal = {INFORMS Journal on Computing},
  volume  = {15},
  number  = {1},
  pages   = {82--92},
  year    = {2003},
}
@inproceedings{gionis1999similarity,
  author    = {Gionis, A. and Indyk, P. and Motwani, R.},
  title     = {Similarity search in high dimensions via hashing},
  booktitle = {VLDB'99},
  pages     = {518--529},
  year      = {1999},
  publisher = {Morgan Kaufmann Publishers Inc.},
  address   = {San Francisco, CA, USA},
}

@inproceedings{johnson1996asymptotic,
  author    = {Johnson, D. S. and McGeoch, L. A. and Rothberg, E. E.},
  title     = {Asymptotic experimental analysis for the {Held-Karp} traveling salesman bound},
  booktitle = {SODA'96},
  pages     = {341--350},
  year      = {1996},
}

@article{Glover2001555,
  author  = {Glover, Fred and Gutin, Gregory and Yeo, Anders and Zverovich, Alexey},
  title   = {Construction heuristics for the asymmetric {TSP}},
  journal = {European Journal of Operational Research},
  volume  = {129},
  number  = {3},
  pages   = {555--568},
  year    = {2001},
  issn    = {0377-2217},
}

@article{1629195,
  author    = {Hyde, Julian},
  title     = {Data in flight},
  journal   = cacm,
  volume    = {53},
  number    = {1},
  pages     = {48--52},
  year      = {2010},
  publisher = {ACM},
  address   = {New York, NY, USA},
  issn      = {0001-0782},
  doi       = {10.1145/1629175.1629195},
}
 
 @article{1365816,
   author  = {Chang, Fay and Dean, Jeffrey and Ghemawat, Sanjay and Hsieh, Wilson C. and Wallach, Deborah A. and Burrows, Mike and Chandra, Tushar and Fikes, Andrew and Gruber, Robert E.},
   title   = {Bigtable: A Distributed Storage System for Structured Data},
   journal = {ACM Trans. Comput. Syst.},
   volume  = {26},
   number  = {2},
   pages   = {1--26},
   year    = {2008},
 }
 
 @inproceedings{boncz2005,
   author    = {Boncz, P. and Zukowski, M. and Nes, N.},
   title     = {{MonetDB/X100}: Hyper-Pipelining Query Execution},
   booktitle = {CIDR '05},
   year      = {2005},
 }
 @inproceedings{655800,
   author    = {Goldstein, J. and Ramakrishnan, R. and Shaft, U.},
   title     = {Compressing relations and indexes},
   booktitle = {Proceedings of the 14th International Conference on Data Engineering},
   pages     = {370--379},
   year      = {1998},
   month     = feb,
   doi       = {10.1109/ICDE.1998.655800},
   issn      = {1063-6382},
   keywords  = {B-trees;R-trees;buffer pool;cardinality fields;decision support systems;disk throughput;fact tables;gzip;index compression;index structures;lossy compression;memory utilization;numeric fields;page level compression;records;relation compression;relational database;tree data structures;tuple decompression;buffer storage;data compression;decision support systems;relational databases;software performance evaluation;tree data structures;},
 }
 @article{Szepkuti:2004:DifferenceSequence,
   author       = {Sz{\'e}pk{\'u}ti, Istv{\'a}n},
   title        = {Difference sequence compression of multidimensional databases},
   journal      = {Periodica Polytechnica Electrical Engineering},
   volume       = {48},
   number       = {3--4},
   pages        = {197--218},
   year         = {2004},
   url          = {http://www.pp.bme.hu/ee/2004_3/pdf/ee2004_3_07.pdf},
   abstract-url = {http://www.pp.bme.hu/ee/2004_3/ee2004_3_07.html},
   topic        = {OLAP},
   subtopic     = {Compression},
 }


@inproceedings{raman2006wring,
  author    = {Raman, V. and Swart, G.},
  title     = {How to wring a table dry: Entropy compression of relations and querying of compressed relations},
  booktitle = {VLDB'06},
  pages     = {858--869},
  year      = {2006},
}
@inproceedings{656226,
  author    = {Goldstein, Jonathan and Ramakrishnan, Raghu and Shaft, Uri},
  title     = {Compressing Relations and Indexes},
  booktitle = {ICDE '98},
  pages     = {370--379},
  year      = {1998},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
  isbn      = {0-8186-8289-2},
}
@article{Eavis2010259,
  author  = {Eavis, Todd and Dimitrov, George and Dimitrov, Ivan and Cueva, David and Lopez, Alex and Taleb, Ahmad},
  title   = {Parallel {OLAP} with the {Sidera} server},
  journal = {Future Generation Computer Systems},
  volume  = {26},
  number  = {2},
  pages   = {259--266},
  year    = {2010},
}

@inproceedings{yuan:fsm-state-duplication,
  author    = {Yuan, Lin and Qu, Gang and Villa, Tiziano and {Sangiovanni-Vincentelli}, Alberto},
  title     = {{FSM} Re-Engineering and Its Application in Low Power State Encoding},
  booktitle = {Proceedings, Asia South Pacific Design Automation Conference (ASP-DAC)},
  pages     = {254--259},
  year      = {2005},
  also      = {cf Scott van Wart's Honours project, UNBSJ 2005},
}

@inproceedings{258541,
  author    = {Trevisan, Luca},
  title     = {When {Hamming} meets {Euclid}: the approximability of geometric {TSP} and {MST}},
  booktitle = {STOC '97},
  pages     = {21--29},
  year      = {1997},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {0-89791-888-6},
}
 
 @article{ernvall1985np,
   author    = {Ernvall, J. and Katajainen, J. and Penttonen, M.},
   title     = {{NP}-completeness of the {Hamming} salesman problem},
   journal   = {BIT Numerical Mathematics},
   volume    = {25},
   number    = {1},
   pages     = {289--292},
   year      = {1985},
   publisher = {Springer},
 }

@inproceedings{10.1109/SSDM.1999.787635,
  author    = {Schaller, Martin},
  title     = {Reclustering of High Energy Physics Data},
  booktitle = {SSDBM'99},
  year      = {1999},
  publisher = {IEEE Computer Society},
  address   = {Washington, DC, USA},
}

@inproceedings{1286703---usejournalversioninsteadBatory:1979:STF:320107.320125,
  author    = {Batory, Don S.},
  title     = {On searching transposed files},
  booktitle = {VLDB'78},
  pages     = {488},
  year      = {1978},
  publisher = {Morgan Kaufmann Publishers Inc.},
}
  
  @article{Batory:1979:STF:320107.320125,
    author    = {Batory, D. S.},
    title     = {On searching transposed files},
    journal   = {ACM Trans. Database Syst.},
    volume    = {4},
    number    = {4},
    pages     = {531--544},
    year      = {1979},
    month     = dec,
    publisher = {ACM},
    address   = {New York, NY, USA},
    issn      = {0362-5915},
    doi       = {10.1145/320107.320125},
    url       = {http://doi.acm.org/10.1145/320107.320125},
    numpages  = {14},
    acmid     = {320125},
  }
 
 
@inproceedings{abadi2008column,
  author    = {Abadi, D. J. and Madden, S. R. and Hachem, N.},
  title     = {Column-stores vs. row-stores: how different are they really?},
  booktitle = {SIGMOD'08},
  pages     = {967--980},
  year      = {2008},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
  
@article{flahive2007balancing,
  author  = {Flahive, M. and Bose, B.},
  title   = {Balancing cyclic {R-ary} {Gray} codes},
  journal = {Electronic Journal of Combinatorics},
  volume  = {14},
  number  = {R31},
  pages   = {1},
  year    = {2007},
}

@article{ng1997block,
  author  = {Ng, W. K. and Ravishankar, C. V.},
  title   = {Block-oriented compression techniques for large statistical databases},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {9},
  number  = {2},
  pages   = {314--328},
  year    = {1997},
}

@inproceedings{houkjoer2006simple,
  author    = {Houkj{\ae}r, K. and Torp, K. and Wind, R.},
  title     = {Simple and realistic data generation},
  booktitle = {VLDB'06},
  pages     = {1243--1246},
  year      = {2006},
  publisher = {VLDB Endowment},
  address   = {San Jose, CA, USA},
}
@inproceedings{1457160,
  author    = {Zukowski, Marcin and Nes, Niels and Boncz, Peter},
  title     = {{DSM} vs. {NSM}: {CPU} performance tradeoffs in block-oriented query processing},
  booktitle = {DaMoN '08},
  pages     = {47--54},
  year      = {2008},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
 
 @inproceedings{656552,
   author    = {Padmanabhan, Sriram and Malkemus, Timothy and Agarwal, Ramesh C. and Jhingran, Anant},
   title     = {Block Oriented Processing of Relational Database Operations in Modern Computer Architectures},
   booktitle = {ICDE '01},
   pages     = {567--574},
   year      = {2001},
   publisher = {IEEE Computer Society},
   address   = {Washington, DC, USA},
 }
 
@article{blockminisnphard,
  author  = {Haddadi, Salim},
  title   = {A note on the {NP}-hardness of the consecutive block minimization problem},
  journal = {International Transactions in Operational Research},
  volume  = {9},
  number  = {6},
  pages   = {775--777},
  year    = {2002},
}

@article{bentley1992fast,
  author  = {Bentley, J. L.},
  title   = {Fast algorithms for geometric traveling salesman problems},
  journal = {INFORMS Journal on Computing},
  volume  = {4},
  number  = {4},
  pages   = {387--411},
  year    = {1992},
}
@inproceedings{bentley1980analysis,
  author    = {Bentley, J. L. and Saxe, J.},
  title     = {An analysis of two heuristics for the {Euclidean} traveling salesman problem},
  booktitle = {Proc. 18th Annual Allerton Conference on Communication, Control, and Computing},
  pages     = {41--49},
  year      = {1980},
}



@article{garey1976some,
  author    = {Garey, M. R. and Johnson, D. S. and Stockmeyer, L.},
  title     = {Some simplified {NP}-complete graph problems},
  journal   = {Theoretical Computer Science},
  volume    = {1},
  number    = {3},
  pages     = {237--267},
  year      = {1976},
  publisher = {Elsevier},
}

@article{lin1973effective,
  author    = {Lin, S. and Kernighan, B. W.},
  title     = {An effective heuristic algorithm for the traveling-salesman problem},
  journal   = {Operations Research},
  volume    = {21},
  number    = {2},
  pages     = {498--516},
  year      = {1973},
  publisher = {Operations Research Society of America},
}

@article{croes1958method,
  author    = {Croes, G. A.},
  title     = {A method for solving traveling-salesman problems},
  journal   = {Operations Research},
  volume    = {6},
  number    = {6},
  pages     = {791--812},
  year      = {1958},
  publisher = {Operations Research Society of America},
}


@article{Sahinalp2004,
  author  = {Sahinalp, S. Cenk and Utis, Andrey},
  title   = {Hardness of String Similarity Search and Other Indexing Problems},
  journal = {Lecture Notes in Computer Science},
  volume  = {3142},
  pages   = {365--400},
  year    = {2004},
}

@inproceedings{10.1109/SFCS.1994.365720,
  author    = {Greene, D. and Parnas, M. and Yao, F.},
  title     = {Multi-index hashing for information retrieval},
  booktitle = {FOCS'94},
  pages     = {722--731},
  year      = {1994},
  isbn      = {0-8186-6580-7},
}

@inproceedings{258656,
  author    = {Indyk, Piotr and Motwani, Rajeev and Raghavan, Prabhakar and Vempala, Santosh},
  title     = {Locality-preserving hashing in multidimensional spaces},
  booktitle = {STOC '97},
  pages     = {618--625},
  year      = {1997},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {0-89791-888-6},
}
 
 @book{Perceptrons1969,
   author    = {Minsky, M. and Papert, S.},
   title     = {Perceptrons},
   publisher = {MIT Press},
   address   = {Cambridge, Massachusetts, USA},
   year      = {1969},
 }
 
@inproceedings{sculley2010web,
  author       = {Sculley, D.},
  title        = {Web-scale k-means clustering},
  booktitle    = {WWW 2010},
  pages        = {1177--1178},
  year         = {2010},
  organization = {ACM},
}



@inproceedings{1514907,
  author    = {Ross, Kenneth A. and Cieslewicz, John},
  title     = {Optimal splitters for database partitioning with size bounds},
  booktitle = {ICDT '09},
  pages     = {98--110},
  year      = {2009},
  isbn      = {978-1-60558-423-2},
}
 
 @inproceedings{db2luw2009,
   author    = {Bhattacharjee, Bishwaranjan and Lim, Lipyeow and Malkemus, Timothy and Mihaila, George and Ross, Kenneth and Lau, Sherman and McArthur, Cathy and Toth, Zoltan and Sherkat, Reza},
   title     = {Efficient index compression in {DB2 LUW}},
   booktitle = {VLDB'09},
   pages     = {1462--1473},
   year      = {2009},
   publisher = {VLDB Endowment},
   address   = {San Jose, CA, USA},
 }
 
@inproceedings{Poess:2003:DCO:1315451.1315531,
  author    = {Poess, Meikel and Potapov, Dmitry},
  title     = {Data compression in {Oracle}},
  booktitle = {VLDB '03},
  pages     = {937--947},
  year      = {2003},
  publisher = {VLDB Endowment},
  isbn      = {0-12-722442-4},
  location  = {Berlin, Germany},
  numpages  = {11},
  url       = {http://portal.acm.org/citation.cfm?id=1315451.1315531},
  acmid     = {1315531},
}
 
 @inproceedings{1739071,
   author    = {Deli{\`e}ge, Fran{\c{c}}ois and Pedersen, Torben Bach},
   title     = {Position list word aligned hybrid: optimizing space and performance for compressed bitmaps},
   booktitle = {EDBT '10},
   year      = {2010},
   publisher = {ACM},
   address   = {New York, NY, USA},
 }
 
 @inproceedings{276876,
   author    = {Indyk, Piotr and Motwani, Rajeev},
   title     = {Approximate nearest neighbors: towards removing the curse of dimensionality},
   booktitle = {STOC '98},
   pages     = {604--613},
   year      = {1998},
   publisher = {ACM},
   address   = {New York, NY, USA},
 }
 @inproceedings{haveliwala2000scalable,
   author    = {Haveliwala, T. H. and Gionis, A. and Indyk, P.},
   title     = {Scalable techniques for clustering the web},
   booktitle = {WebDB (Informal Proceedings)},
   pages     = {129--134},
   year      = {2000},
 }
 
 @inproceedings{301325,
   author    = {Chakrabarti, Amit and Chazelle, Bernard and Gum, Benjamin and Lvov, Alexey},
   title     = {A lower bound on the complexity of approximate nearest-neighbor searching on the {Hamming} cube},
   booktitle = {STOC '99},
   pages     = {305--311},
   year      = {1999},
   publisher = {ACM},
   address   = {New York, NY, USA},
   isbn      = {1-58113-067-8},
 }
 @article{liu2004strong,
   author  = {Liu, D.},
   title   = {A strong lower bound for approximate nearest neighbor searching},
   journal = {Information Processing Letters},
   volume  = {92},
   number  = {1},
   pages   = {23--29},
   year    = {2004},
 }

@inproceedings{276877,
  author    = {Kushilevitz, Eyal and Ostrovsky, Rafail and Rabani, Yuval},
  title     = {Efficient search for approximate nearest neighbor in high dimensional spaces},
  booktitle = {STOC '98},
  pages     = {614--623},
  year      = {1998},
  publisher = {ACM},
  address   = {New York, NY, USA},
  isbn      = {0-89791-962-9},
}
 
 @article{1526989,
   author  = {Haas, Peter J. and Ilyas, Ihab F. and Lohman, Guy M. and Markl, Volker},
   title   = {Discovering and Exploiting Statistical Properties for Query Optimization in Relational Databases: A Survey},
   journal = {Stat. Anal. Data Min.},
   volume  = {1},
   number  = {4},
   pages   = {223--250},
   year    = {2009},
 }
 
 @article{1151106,
   author  = {Gryz, Jarek and Liang, Dongming},
   title   = {Holes in joins},
   journal = {J. Intell. Inf. Syst.},
   volume  = {26},
   number  = {3},
   pages   = {247--268},
   year    = {2006},
 }


@inproceedings{1007641,
  author    = {Ilyas, Ihab F. and Markl, Volker and Haas, Peter and Brown, Paul and Aboulnaga, Ashraf},
  title     = {{CORDS}: automatic discovery of correlations and soft functional dependencies},
  booktitle = {SIGMOD '04},
  pages     = {647--658},
  year      = {2004},
  isbn      = {1-58113-859-8},
}
 
@inproceedings{brown2003bhunt,
  author    = {Brown, P. G. and Haas, P. J.},
  title     = {{BHUNT}: Automatic discovery of fuzzy algebraic constraints in relational data},
  booktitle = {VLDB '03},
  year      = {2003},
}

@inproceedings{lim2003sash,
  author    = {Lim, L. and Wang, M. and Vitter, J. S.},
  title     = {{SASH}: A self-adaptive histogram set for dynamically changing workloads},
  booktitle = {VLDB '03},
  pages     = {369--380},
  year      = {2003},
}

@article{edmonds2003mining,
  author    = {Edmonds, J. and Gryz, J. and Liang, D. and Miller, R. J.},
  title     = {Mining for empty spaces in large data sets},
  journal   = {Theoretical Computer Science},
  volume    = {296},
  number    = {3},
  pages     = {435--452},
  year      = {2003},
  publisher = {Elsevier},
}


@book{1550806,
  author    = {Kaminsky, Alan},
  title     = {Building Parallel Programs: {SMPs}, Clusters \& {Java}},
  publisher = {Course Technology Press},
  address   = {Boston, MA, United States},
  year      = {2009},
  isbn      = {1423901983, 9781423901983},
}
 
 @inproceedings{10.1109/DCC.2007.44,
   author    = {Burtscher, Martin and Ratanaworabhan, Paruj},
   title     = {High Throughput Compression of Double-Precision Floating-Point Data},
   booktitle = {DCC'07},
   pages     = {293--302},
   year      = {2007},
 }

@article{lindstrom2006fast,
  author  = {Lindstrom, P. and Isenburg, M.},
  title   = {Fast and efficient compression of floating-point data},
  journal = {IEEE Transactions on Visualization and Computer Graphics},
  volume  = {12},
  number  = {5},
  pages   = {1245--1250},
  year    = {2006},
}
@inproceedings{ratanaworabhan2006fast,
  author    = {Ratanaworabhan, P. and Ke, J. and Burtscher, M.},
  title     = {Fast lossless compression of scientific floating-point data},
  booktitle = {DCC'06},
  pages     = {133--142},
  year      = {2006},
}
@inproceedings{engelson2000lossless,
  author    = {Engelson, V. and Fritzson, D. and Fritzson, P.},
  title     = {Lossless compression of high-volume numerical data from simulations},
  booktitle = {DCC'00},
  pages     = {574--586},
  year      = {2000},
}

@article{moffat2000binary,
  author    = {Moffat, A. and Stuiver, L.},
  title     = {Binary interpolative coding for effective index compression},
  journal   = {Information Retrieval},
  volume    = {3},
  number    = {1},
  pages     = {25--47},
  year      = {2000},
  publisher = {Springer},
}
@article{elias1975universal,
  author  = {Elias, P.},
  title   = {Universal codeword sets and representations of the integers},
  journal = {IEEE Transactions on Information Theory},
  volume  = {21},
  number  = {2},
  pages   = {194--203},
  year    = {1975},
}
@article{gavett1965three,
  author    = {Gavett, J. W.},
  title     = {Three heuristic rules for sequencing jobs to a single production facility},
  journal   = {Management Science},
  volume    = {11},
  number    = {8},
  pages     = {166--176},
  year      = {1965},
  publisher = {JSTOR},
}

@comment{garey1976some,
  title={Some {NP}-complete geometric problems},
  author={Garey, M. R. and Graham, R. L. and Johnson, D. S.},
  booktitle={STOC'76},
  pages={10--22},
  year={1976}
}
@article{bellmore1968traveling,
  author    = {Bellmore, M. and Nemhauser, G. L.},
  title     = {The traveling salesman problem: a survey},
  journal   = {Operations Research},
  volume    = {16},
  number    = {3},
  pages     = {538--558},
  year      = {1968},
  publisher = {JSTOR},
}

@article{flood1956,
  author  = {Flood, M. M.},
  title   = {The traveling-salesman problem},
  journal = {Operations Research},
  volume  = {4},
  number  = {1},
  pages   = {61--75},
  year    = {1956},
}

@article{bhat1996balanced,
  author  = {Bhat, G. S. and Savage, C. D.},
  title   = {Balanced {Gray} codes},
  journal = {Electronic Journal of Combinatorics},
  volume  = {3},
  number  = {1},
  pages   = {R25},
  year    = {1996},
}


@inproceedings{1646158,
  author    = {Bj{\o}rklund, Truls A. and Grimsmo, Nils and Gehrke, Johannes and Torbj{\o}rnsen, {\O}ystein},
  title     = {Inverted indexes vs. bitmap indexes in decision support systems},
  booktitle = {CIKM '09},
  pages     = {1509--1512},
  year      = {2009},
}
 
 @inproceedings{yan2009inverted,
   author    = {Yan, H. and Ding, S. and Suel, T.},
   title     = {Inverted index compression and query processing with optimized document ordering},
   booktitle = {WWW '09},
   pages     = {401--410},
   year      = {2009},
 }
  
 @inproceedings{1772723,
   author    = {Ding, Shuai and Attenberg, Josh and Suel, Torsten},
   title     = {Scalable techniques for document identifier assignment in inverted indexes},
   booktitle = {WWW '10},
   pages     = {311--320},
   year      = {2010},
   publisher = {ACM},
   address   = {New York, NY, USA},
 }
 
 @inproceedings{1692916,
   author    = {O'Neil, Patrick and O'Neil, Elizabeth and Chen, Xuedong and Revilak, Stephen},
   title     = {The Star Schema Benchmark and Augmented Fact Table Indexing},
   booktitle = {TPCTC 2009},
   pages     = {237--252},
   year      = {2009},
 }
 
@inproceedings{1367550,
  author    = {Zhang, Jiangong and Long, Xiaohui and Suel, Torsten},
  title     = {Performance of compressed inverted list caching in search engines},
  booktitle = {WWW '08},
  pages     = {387--396},
  year      = {2008},
}
 
 @book{323905,
   author    = {Witten, Ian H. and Moffat, Alistair and Bell, Timothy C.},
   title     = {Managing Gigabytes: Compressing and Indexing Documents and Images},
   edition   = {Second},
   publisher = {Morgan Kaufmann Publishers Inc.},
   address   = {San Francisco, CA, USA},
   year      = {1999},
   isbn      = {1-55860-570-3},
 }
 
 @article{1034897,
   author  = {Anh, Vo Ngoc and Moffat, Alistair},
   title   = {Inverted Index Compression Using Word-Aligned Binary Codes},
   journal = {Information Retrieval},
   volume  = {8},
   number  = {1},
   pages   = {151--166},
   year    = {2005},
   issn    = {1386-4564},
 }
 
 @inproceedings{blandford2002index,
   author    = {Blandford, D. and Blelloch, G.},
   title     = {Index compression through document reordering},
   booktitle = {DCC 2002},
   pages     = {342--351},
   year      = {2002},
 }
 @article{763298,
   author  = {Shieh, Wann-Yun and Chen, Tien-Fu and Shann, Jean Jyh-Jiun and Chung, Chung-Ping},
   title   = {Inverted file compression through document identifier reassignment},
   journal = {Inf. Process. Manage.},
   volume  = {39},
   number  = {1},
   pages   = {117--131},
   year    = {2003},
   issn    = {0306-4573},
 }
 
 @inproceedings{1009046,
   author    = {Silvestri, Fabrizio and Orlando, Salvatore and Perego, Raffaele},
   title     = {Assigning identifiers to documents to enhance the clustering property of fulltext indexes},
   booktitle = {SIGIR '04},
   pages     = {305--312},
   year      = {2004},
 }
 
 
 @article{blanco2005document,
   author    = {Blanco, R. and Barreiro, A.},
   title     = {Document identifier reassignment through dimensionality reduction},
   journal   = {Advances in Information Retrieval},
   volume    = {3408},
   pages     = {375--387},
   year      = {2005},
   publisher = {Springer},
 }
@article{blanco2006tsp,
  author    = {Blanco, R. and Barreiro, A.},
  title     = {{TSP} and cluster-based solutions to the reassignment of document identifiers},
  journal   = {Information Retrieval},
  volume    = {9},
  number    = {4},
  pages     = {499--517},
  year      = {2006},
  publisher = {Springer},
}
@inproceedings{1763668,
  author    = {Silvestri, Fabrizio},
  title     = {Sorting out the document identifier assignment problem},
  booktitle = {ECIR'07},
  pages     = {101--112},
  year      = {2007},
  isbn      = {978-3-540-71494-1},
}


@inproceedings{walder2009benchmarking,
  author    = {Walder, J. and Kr{\'a}tk{\'y}, M. and Ba{\v{c}}a, R.},
  title     = {Benchmarking Coding Algorithms for the {R-tree} Compression},
  booktitle = {Proceedings of the Dateso 2009 Annual International Workshop on Databases, Texts, Specifications and Objects},
  pages     = {32--43},
  year      = {2009},
}

@article{zobel2006inverted,
  author    = {Zobel, J. and Moffat, A.},
  title     = {Inverted files for text search engines},
  journal   = {ACM Computing Surveys},
  volume    = {38},
  number    = {2},
  pages     = {6},
  year      = {2006},
  publisher = {ACM},
}
@inproceedings{wu2008breaking,
  author       = {Wu, K. and Stockinger, K. and Shoshani, A.},
  title        = {Breaking the curse of cardinality on bitmap indexes},
  booktitle    = {SSDBM '08},
  pages        = {348--365},
  year         = {2008},
  organization = {Springer},
}

@article{necir2010data,
  author    = {Necir, H.},
  title     = {A data mining approach for efficient selection bitmap join index},
  journal   = {International Journal of Data Mining, Modelling and Management},
  volume    = {2},
  number    = {3},
  pages     = {238--251},
  year      = {2010},
  publisher = {Inderscience},
}
@article{bellatreche2008data,
  author  = {Bellatreche, L. and Missaoui, R. and Necir, H. and Drias, H.},
  title   = {A data mining approach for selecting bitmap join indices},
  journal = {Journal of Computing Science and Engineering},
  volume  = {2},
  number  = {1},
  pages   = {206--223},
  year    = {2008},
}
@inproceedings{1646083,
  author    = {Madduri, Kamesh and Wu, Kesheng},
  title     = {Efficient joins with compressed bitmap indexes},
  booktitle = {CIKM '09},
  pages     = {1017--1026},
  year      = {2009},
}
 @incollection{johnsonmcgeoch1997,
   author    = {Johnson, David S. and McGeoch, Lyle A.},
   title     = {The Traveling Salesman Problem: A Case Study in Local Optimization},
   booktitle = {Local Search in Combinatorial Optimization},
   editor    = {Aarts, E. H. L. and Lenstra, J. K.},
   pages     = {215--310},
   publisher = {John Wiley and Sons},
   address   = {Hoboken, NJ, USA},
   year      = {1997},
   note      = {\url{http://akpublic.research.att.com/~dsj/papers/TSPchapter.pdf} (Last checked 07-10-2010)},
 }
 
 @book{1744275,
   author    = {Reinelt, Gerhard},
   title     = {The traveling salesman: computational solutions for {TSP} applications},
   publisher = {Springer-Verlag},
   address   = {Berlin, Heidelberg},
   year      = {1994},
   isbn      = {3-540-58334-3},
 }

    @article{karp1977,
      author  = {Karp, Richard M.},
      title   = {Probabilistic Analysis of Partitioning Algorithms for the Traveling-Salesman Problem in the Plane},
      journal = {Mathematics of Operations Research},
      volume  = {2},
      number  = {3},
      pages   = {209--224},
      year    = {1977},
    }
        
    @inproceedings{DBLP:conf/vldb/AgarwalADGNRS96,
      author    = {Agarwal, Sameet and Agrawal, Rakesh and Deshpande, Prasad and Gupta, Ashish and Naughton, Jeffrey F. and Ramakrishnan, Raghu and Sarawagi, Sunita},
      title     = {On the Computation of Multidimensional Aggregates},
      booktitle = {VLDB'96},
      pages     = {506--521},
      year      = {1996},
      publisher = {Morgan Kaufmann Publishers Inc.},
      address   = {San Francisco, CA, USA},
    }

@inproceedings{1807094,
  author    = {Kane, Daniel M. and Nelson, Jelani and Woodruff, David P.},
  title     = {An optimal algorithm for the distinct elements problem},
  booktitle = {PODS '10},
  pages     = {41--52},
  year      = {2010},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
@article{1320134,
  author  = {Welch, T. A.},
  title   = {A Technique for High-Performance Data Compression},
  journal = {Computer},
  volume  = {17},
  number  = {6},
  pages   = {8--19},
  year    = {1984},
}
@article{ziv1978compression,
  author    = {Ziv, J. and Lempel, A.},
  title     = {Compression of individual sequences via variable-rate coding},
  journal   = {IEEE Transactions on Information Theory},
  volume    = {24},
  number    = {5},
  pages     = {530--536},
  year      = {1978},
  publisher = {IEEE},
}
@inproceedings{bellatreche2007pruning,
  author    = {Bellatreche, L. and Boukhalfa, K. and Mohania, M.},
  title     = {Pruning search space of physical database design},
  booktitle = {DEXA'07},
  pages     = {479--488},
  year      = {2007},
}

@inproceedings{143840,
  author    = {Graefe, G. and Shapiro, L. D.},
  title     = {Data compression and database performance},
  booktitle = {Proceedings of the 1991 Symposium on Applied Computing},
  pages     = {22--27},
  year      = {1991},
  month     = apr,
  doi       = {10.1109/SOAC.1991.143840},
  keywords  = {compressed data; data compression; data management; database performance; decompressed data; network bandwidth; query processing algorithms; storage space; database management systems; performance evaluation},
}

@article{bentley2001data,
  author    = {Bentley, J. and McIlroy, D.},
  title     = {Data compression with long repeated strings},
  journal   = {Information Sciences},
  year      = {2001},
  volume    = {135},
  number    = {1--2},
  pages     = {1--11},
  publisher = {Elsevier},
}



@inproceedings{cui:context-preserving,
  author       = {Cui, Weiwei and Wu, Yingcai and Liu, Shixia and Wei, Furu and Zhou, M. X. and Qu, Huamin},
  title        = {Context Preserving Dynamic Word Cloud Visualization},
  booktitle    = {PacificVis'10},
  pages        = {121--128},
  year         = {2010},
  month        = mar,
  organization = {IEEE},
}



@misc{elak:model-humanity-globe,
  author       = {{El Akkad}, Omar},
  title        = {Supercomputers Seek to `Model Humanity'},
  howpublished = {The Globe and Mail, 18 June 2010},
}

@inproceedings{deveaux2007adaptive,
  author    = {Deveaux, J. P. and Rau-Chaplin, A. and Zeh, N.},
  title     = {Adaptive Tuple Differential Coding},
  booktitle = {DEXA'07},
  pages     = {109--119},
  year      = {2007},
}

@article{mart:using-textual,
  author  = {{Martin-Bautista}, M. J. and Molina, C. and Tejeda, E. and {Amparo Vila}, M.},
  title   = {Using Textual Dimensions in Data Warehousing Processes},
  journal = {Communications in Computer and Information Science},
  volume  = {81},
  pages   = {158--167},
  year    = {2010},
}
  
  @inproceedings{644113,
    author    = {Fagin, Ronald and Kumar, Ravi and Sivakumar, D.},
    title     = {Comparing top k lists},
    booktitle = {SODA '03},
    pages     = {28--36},
    year      = {2003},
  }


@book{boum:pentaho-solutions,
  author    = {Bouman, Roland and {van Dongen}, Jos},
  title     = {Pentaho Solutions: Business Intelligence and Data Warehousing with {Pentaho} and {MySQL}},
  publisher = {Wiley},
  year      = {2009},
  isbn      = {978-0470484326},
}


@book{cast:kettle-solutions,
  author    = {Casters, Matt and Bouman, Roland and {van Dongen}, Jos},
  title     = {Pentaho {Kettle} Solutions: Building Open Source {ETL} Solutions with {Pentaho} Data Integration},
  publisher = {Wiley},
  isbn      = {978-0470635179},
  year      = {2010},
}

@book{gorm:pentaho-reporting-book,
  author    = {Gorman, Will},
  title     = {Pentaho Reporting 3.5 for {Java} Developers},
  publisher = {Packt Publishing},
  isbn      = {978-1847193193},
  year      = {2009},
}

@book{kimball2002dwt,
  author    = {Kimball, Ralph and Ross, Margy},
  title     = {The Data Warehouse Toolkit: The Complete Guide to Dimensional Modeling},
  edition   = {2nd},
  publisher = {Wiley},
  year      = {2002},
  isbn      = {978-0471200246},
}

@book{inmo:building-dw,
  author    = {Inmon, W. H.},
  title     = {Building the Data Warehouse},
  edition   = {4th},
  publisher = {Wiley},
  year      = {2005},
  isbn      = {978-0764599446},
}


@misc{1key:dw-explanations,
  author       = {1keydata.com},
  title        = {Data Warehousing: A Look at Business Intelligence and Data Warehouse},
  howpublished = {\url{http://www.1keydata.com/datawarehousing/datawarehouse.html}},
  note         = {last checked 4-nov-2010},
  year         = {2010},
}


@book{kimb:dw-lifecycle-toolkit,
  author    = {Kimball, Ralph and Ross, Margy and Thornthwaite, Warren and Mundy, Joy and Becker, Bob},
  title     = {The Data Warehouse Lifecycle Toolkit},
  edition   = {2nd},
  publisher = {Wiley},
  isbn      = {978-0470149775},
  year      = {2008},
  extranote = {probably more emphasis on business/mgmt},
}


@article{Anh:2010:ICU:1712666.1712668,
  author  = {Anh, Vo Ngoc and Moffat, Alistair},
  title   = {Index compression using 64-bit words},
  journal = {Software: Practice and Experience},
  volume  = {40},
  number  = {2},
  year    = {2010},
}


 @article{datta2002querying,
   author  = {Datta, A. and Thomas, H.},
   title   = {Querying compressed data in data warehouses},
   journal = {Information Technology and Management},
   year    = {2002},
   volume  = {3},
   number  = {4},
   pages   = {353--386},
 }

 @article{Westmann:2000:IPC:362084.362137,
   author  = {Westmann, Till and Kossmann, Donald and Helmer, Sven and Moerkotte, Guido},
   title   = {The implementation and performance of compressed databases},
   journal = {SIGMOD Record},
   volume  = {29},
   number  = {3},
   pages   = {55--67},
   month   = sep,
   year    = {2000},
 }
  % NOTE(review): the key suffix marks this entry as a duplicate; presumably an
  % entry keyed db2luw2009 elsewhere in this file supersedes it -- confirm before citing.
  @article{Bhattacharjee:2009:EIC:1687553.1687573-----duplicateusedb2luw2009instead,
    author  = {Bhattacharjee, Bishwaranjan and Lim, Lipyeow and Malkemus, Timothy and Mihaila, George and Ross, Kenneth and Lau, Sherman and McArthur, Cathy and Toth, Zoltan and Sherkat, Reza},
    title   = {Efficient index compression in {DB2 LUW}},
    journal = {Proc. VLDB Endow.},
    volume  = {2},
    number  = {2},
    month   = aug,
    year    = {2009},
  }
@article{1451833,
  author  = {Alsberg, P. A.},
  title   = {Space and time savings through large data base compression and dynamic restructuring},
  journal = {Proceedings of the IEEE},
  volume  = {63},
  number  = {8},
  pages   = {1114--1122},
  month   = aug,
  year    = {1975},
  doi     = {10.1109/PROC.1975.9903},
  issn    = {0018-9219},
}
  @incollection{springerlink:10.1007/978-3-642-15105-7_10,
    author         = {Lemke, Christian and Sattler, Kai-Uwe and Faerber, Franz and Zeier, Alexander},
    title          = {Speeding Up Queries in Column Stores},
    booktitle      = {Data Warehousing and Knowledge Discovery},
    series         = {Lecture Notes in Computer Science},
    volume         = {6263},
    pages          = {117--129},
    publisher      = {Springer Berlin / Heidelberg},
    year           = {2010},
    affiliation    = {SAP AG, Walldorf, Germany},
    omittingeditor = {Bach Pedersen, Torben and Mohania, Mukesh and Tjoa, A},
  }

@article{rome:mdbe,
  author  = {Romero, Oscar and Abell{\'o}, Alberto},
  title   = {Automatic Validation of Requirements to Support Multidimensional Design},
  journal = {Data and Knowledge Engineering},
  volume  = {69},
  pages   = {917--942},
  year    = {2010},
}



@inproceedings{dehn:dolap07,
  author    = {Dehne, Frank and Eavis, Todd and {Rau-Chaplin}, Andrew},
  title     = {Efficient Computation of View Subsets},
  booktitle = {Proceedings, DOLAP'07},
  publisher = {ACM},
  pages     = {65--72},
  year      = {2007},
}



@book{wrem:dwolap-book,
  editor    = {Wrembel, Robert and Koncilia, Christian},
  title     = {Data warehouses and {OLAP}: concepts, architectures, and solutions},
  publisher = {IRM Press},
  year      = {2007},
}


@article{onei:multi-table-joins,
  author    = {O'Neil, Patrick and Graefe, Goetz},
  title     = {Multi-table joins through bitmapped join indices},
  journal   = {SIGMOD Rec.},
  volume    = {24},
  number    = {3},
  pages     = {8--11},
  month     = sep,
  year      = {1995},
  issn      = {0163-5808},
  numpages  = {4},
  acmid     = {212001},
  publisher = {ACM},
  address   = {New York, NY, USA},
}



@inproceedings{thom:pygrametl,
  author    = {Thomsen, Christian and Pedersen, Torben Bach},
  title     = {{pygrametl}: A Powerful Programming Framework for {Extract-Transform-Load} Programming},
  booktitle = {Proceedings, DOLAP'09},
  pages     = {49--56},
  year      = {2009},
  publisher = {ACM},
}

@inproceedings{pede:warehousing-world,
  author    = {Pedersen, Torben Bach},
  title     = {Warehousing the World---A Few Remaining Challenges},
  booktitle = {Proceedings, DOLAP'07},
  publisher = {ACM},
  pages     = {101--102},
  year      = {2007},
}

@inproceedings{bell:yaa,
  author    = {Bellatreche, Ladjel and Boukhalfa, Kamel},
  title     = {Yet Another Algorithms for Selecting Bitmap Join Indexes},
  booktitle = {Proceedings, DaWaK'10 (LNCS 6263)},
  publisher = {Springer-Verlag},
  pages     = {105--116},
  year      = {2010},
}


@article{pere:contextualizingDW,
  author  = {P{\'e}rez-Mart{\'\i}nez, Juan Manuel and Berlanga-Llavori, Rafael and Aramburu-Cabo, Maria Jos{\'e} and Pedersen, Torben Bach},
  title   = {Contextualizing data warehouses with documents},
  journal = {Decision Support Systems},
  volume  = {45},
  pages   = {77--94},
  year    = {2008},
}



@misc{mago:open-source-dw,
  author       = {Magoulis, Roger},
  title        = {The Open Source Data Warehouse},
  howpublished = {slides online from talk at MySQL Users Conference, \url{http://www.mysqluc.com/cs/mysqluc2005/view/e_sess/6196}},
  year         = {2005},
}

@article{pede:md-db-tech,
  author  = {Pedersen, Torben Bach and Jensen, Christian S.},
  title   = {Multidimensional Database Technology},
  journal = {IEEE Computer},
  pages   = {40--46},
  month   = dec,
  year    = {2001},
}

@article{chau:db-tech-dss,
  author  = {Chaudhuri, Surajit and others},
  title   = {Database Technology for Decision Support Systems},
  journal = {IEEE Computer},
  pages   = {48--55},
  month   = dec,
  year    = {2001},
}

@techreport{sara:datacube,
  author      = {Sarawagi, Sunita and Agrawal, Rakesh and Gupta, Ashish},
  title       = {On Computing the Data Cube},
  institution = {IBM Almaden Research Center},
  note        = {\url{http://www.almaden.ibm.com/cs/projects/iis/hdb/Publications/papers/cube_rj.pdf}},
  year        = {1996},
}



@article{stam:survey-attribution,
  author  = {Stamatatos, Efstathios},
  title   = {A survey of modern authorship attribution methods},
  journal = {Journal of the American Society for Information Science and Technology},
  volume  = {60},
  number  = {3},
  pages   = {538--556},
  year    = {2009},
}

@misc{lzolib,
  author       = {Oberhumer, Markus Franz Xaver Johannes},
  title        = {{LZO} real-time data compression library},
  howpublished = {online: \url{http://www.oberhumer.com/opensource/lzo/}},
  year         = {2010},
  note         = {checked 2010-12-10},
}
@misc{gailly2004zlib,
  author       = {Gailly, Jean-loup and Adler, Mark},
  title        = {{Zlib} compression library},
  howpublished = {online: \url{http://www.zlib.net/}},
  year         = {2004},
}



@article{gold:maxflow-pcomplete,
  author  = {Goldschlager, L. M. and Shaw, R. A. and Staples, J.},
  title   = {The maximum flow problem is log space complete for {P}},
  journal = {Theoretical Computer Science},
  volume  = {21},
  pages   = {105--111},
  year    = {1982},
}

@article{spiegler1985storage,
  author    = {Spiegler, I. and Maayan, R.},
  title     = {Storage and retrieval considerations of binary data bases},
  journal   = {Information Processing \& Management},
  year      = {1985},
  volume    = {21},
  number    = {3},
  pages     = {233--254},
  publisher = {Elsevier},
  issn      = {0306-4573},
}
@article{Witten:1987:ACD:214762.214771,
  author    = {Witten, Ian H. and Neal, Radford M. and Cleary, John G.},
  title     = {Arithmetic coding for data compression},
  journal   = {Commun. ACM},
  volume    = {30},
  number    = {6},
  pages     = {520--540},
  month     = jun,
  year      = {1987},
  issn      = {0001-0782},
  numpages  = {21},
  doi       = {10.1145/214762.214771},
  url       = {http://doi.acm.org/10.1145/214762.214771},
  acmid     = {214771},
  publisher = {ACM},
  address   = {New York, NY, USA},
}
@article{Moffat:1998:ACR:290159.290162,
  author    = {Moffat, Alistair and Neal, Radford M. and Witten, Ian H.},
  title     = {Arithmetic coding revisited},
  journal   = {ACM Trans. Inf. Syst.},
  volume    = {16},
  number    = {3},
  pages     = {256--294},
  month     = jul,
  year      = {1998},
  issn      = {1046-8188},
  numpages  = {39},
  doi       = {10.1145/290159.290162},
  url       = {http://doi.acm.org/10.1145/290159.290162},
  acmid     = {290162},
  publisher = {ACM},
  address   = {New York, NY, USA},
  keywords  = {approximate coding, arithmetic coding, text compression, word-based model},
}
@article{effelsberg1984principles,
  author    = {Effelsberg, W. and Haerder, T.},
  title     = {Principles of database buffer management},
  journal   = {ACM Transactions on Database Systems},
  year      = {1984},
  volume    = {9},
  number    = {4},
  pages     = {560--595},
  issn      = {0362-5915},
  publisher = {ACM},
}
@book{gree:pcomplete-book,
  author    = {Greenlaw, Raymond and Hoover, H. James and Ruzzo, Walter L.},
  title     = {Limits to Parallel Computation: {P}-completeness Theory},
  publisher = {Oxford University Press},
  year      = {1995},
}

@article{Marcelloni20101924,
  author   = {Marcelloni, Francesco and Vecchio, Massimo},
  title    = {Enabling energy-efficient and lossy-aware data compression in wireless sensor networks by multi-objective evolutionary optimization},
  journal  = {Information Sciences},
  volume   = {180},
  number   = {10},
  pages    = {1924--1941},
  year     = {2010},
  note     = {Special Issue on Intelligent Distributed Information Systems},
  issn     = {0020-0255},
  doi      = {10.1016/j.ins.2010.01.027},
  url      = {http://www.sciencedirect.com/science/article/B6V0C-4Y95RRK-5/2/e05bf3d54bd169badba5043926d3240f},
  keywords = {Wireless sensor networks, Data compression, Multi-objective evolutionary algorithms, Energy efficiency, Signal processing},
}

@article{He20093162,
  author   = {He, Zhen and Veeraraghavan, Prakash},
  title    = {Fine-grained updates in database management systems for flash memory},
  journal  = {Information Sciences},
  volume   = {179},
  number   = {18},
  pages    = {3162--3181},
  year     = {2009},
  issn     = {0020-0255},
  doi      = {10.1016/j.ins.2009.05.010},
  url      = {http://www.sciencedirect.com/science/article/B6V0C-4WBK7G6-1/2/640cde7ab9e39d08b18b69e4a4cface2},
  keywords = {Flash memory, Database, Caching, Buffer replacement, Vertical partitioning, Database optimization},
}

@inproceedings{Sismanis:2006:GES:1182635.1164187,
  author    = {Sismanis, Yannis and Brown, Paul and Haas, Peter J. and Reinwald, Berthold},
  title     = {{GORDIAN}: efficient and scalable discovery of composite keys},
  booktitle = {Proceedings of the 32nd international conference on Very large data bases},
  series    = {VLDB '06},
  pages     = {691--702},
  year      = {2006},
  location  = {Seoul, Korea},
  numpages  = {12},
  url       = {http://portal.acm.org/citation.cfm?id=1182635.1164187},
  acmid     = {1164187},
  publisher = {VLDB Endowment},
}

@article{huhtala1999tane,
  author    = {Huhtala, Y. and K{\"a}rkk{\"a}inen, J. and Porkka, P. and Toivonen, H.},
  title     = {{TANE}: An efficient algorithm for discovering functional and approximate dependencies},
  journal   = {The Computer Journal},
  year      = {1999},
  volume    = {42},
  number    = {2},
  pages     = {100--111},
  issn      = {0010-4620},
  publisher = {British Computer Society},
}

@article{bohm2004k,
  author    = {B{\"o}hm, C. and Krebs, F.},
  title     = {The k-nearest neighbour join: Turbo charging the {KDD} process},
  journal   = {Knowledge and Information Systems},
  year      = {2004},
  volume    = {6},
  number    = {6},
  pages     = {728--749},
  issn      = {0219-1377},
  publisher = {Springer},
}
@inproceedings{5447837,
  author    = {Yao, Bin and Li, Feifei and Kumar, P.},
  title     = {K nearest neighbor queries and {kNN-Joins} in large relational databases (almost) for free},
  booktitle = {2010 IEEE 26th International Conference on Data Engineering (ICDE)},
  pages     = {4--15},
  month     = mar,
  year      = {2010},
}

@article{guting2000foundation,
  author    = {G{\"u}ting, R. H. and B{\"o}hlen, M. H. and Erwig, M. and Jensen, C. S. and Lorentzos, N. A. and Schneider, M. and Vazirgiannis, M.},
  title     = {A foundation for representing and querying moving objects},
  journal   = {ACM Transactions on Database Systems},
  year      = {2000},
  volume    = {25},
  number    = {1},
  pages     = {1--42},
  issn      = {0362-5915},
  publisher = {ACM},
}

@article{beckmann1990r,
  author    = {Beckmann, N. and Kriegel, H. P. and Schneider, R. and Seeger, B.},
  title     = {The {R*-tree}: an efficient and robust access method for points and rectangles},
  journal   = {ACM SIGMOD Record},
  year      = {1990},
  volume    = {19},
  number    = {2},
  pages     = {322--331},
  issn      = {0163-5808},
  publisher = {ACM},
}
@manual{hita:patiencedisk,
  author    = {{Hitachi Global Storage Technologies}},
  title     = {Deskstar {P7K500}},
  year      = {2009},
  note      = {\url{http://www.hitachigst.com/tech/techlib.nsf/techdocs/30C3F554C477835B86257377006E61A0/$file/HGST_Deskstar_P7K500_DS_FINAL.pdf} (Last checked 06-09-2010)},
  othernote = {Emacs syntax checker confused by this entry, so owen will always move it to the end of the bibtex file},
}

% Same article as the wu2006obi entry near the top of this file; cite only one
% of the two keys so the work is not listed twice in a bibliography.
@article{DBLP:journals/tods/WuOS06,
  author    = {Wu, Kesheng and Otoo, Ekow J. and Shoshani, Arie},
  title     = {Optimizing bitmap indices with efficient compression},
  journal   = {ACM Trans. Database Syst.},
  volume    = {31},
  number    = {1},
  pages     = {1--38},
  year      = {2006},
  ee        = {http://doi.acm.org/10.1145/1132863.1132864},
  bibsource = {DBLP, http://dblp.uni-trier.de},
}

@article{Ziv77auniversal,
  author  = {Ziv, Jacob and Lempel, Abraham},
  title   = {A universal algorithm for sequential data compression},
  journal = {IEEE Transactions on Information Theory},
  year    = {1977},
  volume  = {23},
  number  = {3},
  pages   = {337--343},
}